Skip to content
Snippets Groups Projects
create_bib_file.py 5.54 KiB
Newer Older
Bas Nijholt's avatar
Bas Nijholt committed
# Adapted from https://gitlab.kwant-project.org/qt/basnijholt/thesis-bas-nijholt/blob/master/create_bib_file.py

import functools
import glob
import os
from concurrent.futures import ThreadPoolExecutor

import requests
import yaml


Bas Nijholt's avatar
Bas Nijholt committed
def edit_raw_bibtex_entry(key, bib_entry):
Bas Nijholt's avatar
Bas Nijholt committed
    bib_type, *_ = bib_entry.split("{")
    _, *rest = bib_entry.split(",")
    rest = ",".join(rest)
    # Now only modify `rest` because we don't want to touch the key.

    # XXX: I am not sure whether these substitutions are needed.
    # the problem seemed to be the utf-8 `requests.get` encoding.
    to_replace = [("ö", r"\"{o}"), ("ü", r"\"{u}"), ("ë", r"\"{e}"), ("ï", r"\"{i}")]

    for old, new in to_replace:
        rest = rest.replace(old.upper(), new.upper())
        rest = rest.replace(old.lower(), new.lower())

    to_replace = [
        (r"a{\r}", r"\r{a}"),  # "Nyga{\r}rd" -> "Nyg\r{a}rd", bug in doi.org
        ("Josephson", "{J}osephson"),
        ("Majorana", "{M}ajorana"),
        ("Andreev", "{A}ndreev"),
        ("Kramers", "{K}ramers"),
        ("Kitaev", "{K}itaev"),
Bas Nijholt's avatar
Bas Nijholt committed
        (r"{JornHoofwijk}", "Hoofwijk, Jorn"),  # fix for 10.5281/Zenodo.1182437
        (
            "NIRA DYN and DAVID LEVIN and SAMUEL RIPPA",
            "Nira Dyn and David Levin and Samuel Rippa",
        ),  # fix for  10.1093/imanum/10.1.137
Bas Nijholt's avatar
Bas Nijholt committed
        (
            r"metastable0and$\uppi$states",
            r"metastable $0$ and $\pi$ states",
        ),  # fix for 10.1103/physrevb.63.214512
        (
            r"Land{\'{e}}{gFactors}",
            r"Land{\'{e}} {$g$} Factors",
        ),  # fix for PhysRevLett.96.026804
    ]

    journals = [
        ("Advanced Materials", "Adv. Mater."),
        ("Annals of Physics", "Ann. Phys."),
        ("Applied Physics Letters", "Appl. Phys. Lett."),
        ("JETP Lett", "JETP Lett."),
        ("Journal de Physique", "J. Phys."),
        ("Journal of Computational Physics", "J. Comput. Phys."),
        ("Journal of Experimental and Theoretical Physics", "J. Exp. Theor. Phys."),
        ("Journal of Low Temperature Physics", "J. Low Temp. Phys."),
        (
            "Journal of Physics A: Mathematical and Theoretical",
            "J. Phys. A: Math. Theor.",
        ),
        ("Journal of Physics: Condensed Matter", "J. Phys.: Condens. Matter"),
        ("Nano Letters", "Nano Lett."),
        ("Nature Communications", "Nat. Commun."),
        ("Nature Materials", "Nat. Mater."),
        ("Nature Nanotechnology", "Nat. Nanotechnol."),
        ("Nature Physics", "Nat. Phys."),
        ("New Journal of Physics", "New J. Phys."),
        ("Physical Review B", "Phys. Rev. B"),
        ("Physical Review Letters", "Phys. Rev. Lett."),
        ("Physical Review X", "Phys. Rev. X"),
        ("Physical Review", "Phys. Rev."),  # should be before the above subs
        ("Physics-Uspekhi", "Phys. Usp."),
        ("Reports on Progress in Physics", "Rep. Prog. Phys."),
        ("Review of Scientific Instruments", "Rev. Sci. Instrum."),
        ("Reviews of Modern Physics", "Rev. Mod. Phys."),
        ("Science Advances", "Sci. Adv."),
        ("Scientific Reports", "Sci. Rep."),
        ("Semiconductor Science and Technology", "Semicond. Sci. Technol."),
        (
            "Annual Review of Condensed Matter Physics",
            "Annu. Rev. Condens. Matter Phys.",
        ),
        ("{EPL} (Europhysics Letters)", "{EPL}"),
        ("Nature Reviews Materials", "Nat. Rev. Mater."),
        ("Physics Letters", "Phys. Lett."),
        ("The European Physical Journal B", "Eur. Phys. J. B"),
        ("{SIAM} Journal on Numerical Analysis", "{SIAM} J. Numer. Anal."),
        ("{AIP} Conference Proceedings", "{AIP} Conf. Proc."),
Bas Nijholt's avatar
Bas Nijholt committed
        ("{ACM} Transactions on Graphics", "{ACM} Trans. Graph."),
        ("Measurement Science and Technology", "Meas. Sci. Technol"),
        ("Numerische Mathematik", "Numer. Math."),
        ("{IMA} Journal of Numerical Analysis", "{IMA} J. Appl. Math."),
        ("{ACM} Transactions on Mathematical Software", "{ACM} Trans. Math. Softw."),
        ("Journal of Computational and Applied Mathematics", "J. Comput. Appl. Math"),
        ("{SciPost} Physics", "{SciPost} Phys."),
        ("Computer Graphics Forum", "Comput. Graphics Forum"),
Bas Nijholt's avatar
Bas Nijholt committed
    ]

    for old, new in to_replace + journals:
        rest = rest.replace(old, new)

    result = bib_type + "{" + key + "," + rest

    print(result, "\n")
    return result


@functools.lru_cache()
def doi2bib(doi):
    """Return a bibTeX string of metadata for a given DOI."""
    url = "http://dx.doi.org/" + doi
    headers = {"accept": "application/x-bibtex"}
    r = requests.get(url, headers=headers)
    r.encoding = "utf-8"
    return r.text


Bas Nijholt's avatar
Bas Nijholt committed
fname_bib = "paper.yaml"
print("Reading: ", fname_bib)
Bas Nijholt's avatar
Bas Nijholt committed
with open(fname_bib) as f:
Bas Nijholt's avatar
Bas Nijholt committed
    dois = yaml.safe_load(f)
dois = dict(sorted(dois.items()))
Bas Nijholt's avatar
Bas Nijholt committed


with ThreadPoolExecutor() as ex:
    futs = ex.map(doi2bib, list(dois.values()))
    bibs = list(futs)


Bas Nijholt's avatar
Bas Nijholt committed
entries = [edit_raw_bibtex_entry(key, bib) for key, bib in zip(dois.keys(), bibs)]
Bas Nijholt's avatar
Bas Nijholt committed

Bas Nijholt's avatar
Bas Nijholt committed
with open("paper.bib", "w") as out_file:
Bas Nijholt's avatar
Bas Nijholt committed
    fname_other = "not_on_crossref.bib"
Bas Nijholt's avatar
Bas Nijholt committed
    out_file.write("% Created automatically with `python create_bib_file.py`.\n\n")
Bas Nijholt's avatar
Bas Nijholt committed
    out_file.write("@preamble{ {\\providecommand{\\BIBYu}{Yu} } }\n\n")
Bas Nijholt's avatar
Bas Nijholt committed
    out_file.write(f"\n% Below is from `{fname_other}`.\n\n")
    with open(fname_other) as in_file:
Bas Nijholt's avatar
Bas Nijholt committed
        out_file.write(in_file.read())
Bas Nijholt's avatar
Bas Nijholt committed
    out_file.write(f"\n% Below is from `{fname_bib}`.\n\n")
Bas Nijholt's avatar
Bas Nijholt committed
    for e in entries:
Bas Nijholt's avatar
Bas Nijholt committed
        for line in e.split("\n"):
Bas Nijholt's avatar
Bas Nijholt committed
            # Remove the url line
            if "url = {" not in line:
Bas Nijholt's avatar
Bas Nijholt committed
                out_file.write(f"{line}\n")
        out_file.write("\n")