From d457fba87eab4cd8103412e4457c0befe1ab0e3d Mon Sep 17 00:00:00 2001 From: Micha Moskovic Date: Mon, 11 Dec 2023 10:20:23 +0100 Subject: [PATCH] hep: add material to FFT for CDS --- inspire_dojson/hep/rules/bdFFT.py | 5 ++- tests/test_hep_bdFFT.py | 63 +++++++++++++++++++++++++++++++ 2 files changed, 67 insertions(+), 1 deletion(-) diff --git a/inspire_dojson/hep/rules/bdFFT.py b/inspire_dojson/hep/rules/bdFFT.py index 0164e0fc..bded0913 100644 --- a/inspire_dojson/hep/rules/bdFFT.py +++ b/inspire_dojson/hep/rules/bdFFT.py @@ -123,7 +123,10 @@ def _get_hidden(value): return None def _get_filename_and_extension(value): - return os.path.splitext(value.get('filename', value['key'])) + file_name, extension = os.path.splitext(value.get('filename', value['key'])) + if file_name == "document" and value.get("material", "publication") != "publication": + file_name = value["material"] + return file_name, extension file_name, extension = _get_filename_and_extension(value) diff --git a/tests/test_hep_bdFFT.py b/tests/test_hep_bdFFT.py index a2c4a723..40c6bb12 100644 --- a/tests/test_hep_bdFFT.py +++ b/tests/test_hep_bdFFT.py @@ -468,6 +468,69 @@ def test_documents_to_FFT_uses_filename(): assert expected == result['FFT'] +def test_documents_to_FFT_uses_material_as_filename_fallback(): + schema = load_schema('hep') + subschema = schema['properties']['documents'] + + snippet = { + "documents": [ + { + "key": "8f09853e5bc12d6d077ba0833e97626e", + "url": "https://inspirehep.net/files/8f09853e5bc12d6d077ba0833e97626e", + "source": "Springer", + "fulltext": True, + "filename": "document", + "material": "addendum", + }, + { + "key": "35715635c16bc869b4995e150b140bf8", + "url": "https://inspirehep.net/files/35715635c16bc869b4995e150b140bf8", + "hidden": True, + "source": "arxiv", + "filename": "2103.11769.pdf", + "fulltext": True, + "material": "preprint", + "original_url": "http://export.arxiv.org/pdf/2103.11769", + }, + { + "key": "277ff3946ce757cba86a4ab4ebb95287", + "url": "https://inspirehep.net/files/277ff3946ce757cba86a4ab4ebb95287", + "filename": "document", + "fulltext": True, + "material": "publication", + } + ], + } # literature/1852846 + + expected = [ + { + "a": "https://inspirehep.net/files/8f09853e5bc12d6d077ba0833e97626e", + "d": "Fulltext", + "n": "addendum", + "t": "Springer", + }, + { + "a": "https://inspirehep.net/files/35715635c16bc869b4995e150b140bf8", + "d": "Fulltext", + "n": "2103.11769", + "t": "arXiv", + "f": ".pdf", + }, + { + "a": "https://inspirehep.net/files/277ff3946ce757cba86a4ab4ebb95287", + "d": "Fulltext", + "n": "document", + "t": "INSPIRE-PUBLIC", + } + ] + + assert validate(snippet['documents'], subschema) is None + + result = hep2marc.do(snippet) + + assert expected == result['FFT'] + + def test_figures_to_FFT(): schema = load_schema('hep') subschema = schema['properties']['figures']