__init__.py 2.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273
  1. """
  2. Generate BibTeX Entries for PubMed Publications
  3. This module utilizes the API of TeXMed,
  4. a BibTeX interface for PubMed.
  5. TeXMed was written by Arne Muller
  6. https://www.bioinformatics.org/texmed/
  7. Command Line Example:
  8. $ pubmed-bibtex 31025164
  9. @Article{pmid31025164,
  10. Author="...",
  11. Title="...",
  12. Journal="...",
  13. ...
  14. }
  15. Python Example:
  16. >>> from pubmed_bibtex import bibtex_entry_from_pmid
  17. >>> print(bibtex_entry_from_pmid('31025164'))
  18. Copyright (C) 2019 Fabian Peter Hammerle <fabian@hammerle.me>
  19. This program is free software: you can redistribute it and/or modify
  20. it under the terms of the GNU General Public License as published by
  21. the Free Software Foundation, either version 3 of the License, or
  22. (at your option) any later version.
  23. This program is distributed in the hope that it will be useful,
  24. but WITHOUT ANY WARRANTY; without even the implied warranty of
  25. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  26. GNU General Public License for more details.
  27. You should have received a copy of the GNU General Public License
  28. along with this program. If not, see <https://www.gnu.org/licenses/>.
  29. """
import html.parser
import re
import typing

import requests

from pubmed_bibtex.version import __version__
  34. _TEXMED_URL_PATTERN = 'https://www.bioinformatics.org/texmed/cgi-bin' \
  35. '/list.cgi?PMID={pmid}&linkOut'
  36. class _TeXMedHtmlParser(html.parser.HTMLParser):
  37. def __init__(self):
  38. self.bibtex_entry = None
  39. super().__init__()
  40. @staticmethod
  41. def _strip_bibtex_entry(data: str) -> str:
  42. return re.sub(r'\n\% \d+\s?\n', '', data).strip() + '\n'
  43. def handle_data(self, data: str) -> None:
  44. if 'Author' in data:
  45. self.bibtex_entry = self._strip_bibtex_entry(data)
  46. def error(self, message) -> None:
  47. raise Exception(message) # pragma: no cover
  48. def bibtex_entry_from_pmid(pmid: str) -> str:
  49. assert pmid.isdigit(), pmid
  50. resp = requests.get(_TEXMED_URL_PATTERN.format(pmid=pmid))
  51. resp.raise_for_status()
  52. parser = _TeXMedHtmlParser()
  53. parser.feed(resp.text)
  54. return parser.bibtex_entry