diff --git a/docker-compose.yml b/docker-compose.yml index 919c868852..acb34df5a4 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -311,11 +311,14 @@ services: pgpool: restart: "always" - image: bitnami/pgpool + image: pgpool/pgpool:4.2.2 environment: - - PGPOOL_BACKEND_NODES=0:postgresql:5432 - - PGPOOL_SR_CHECK_USER=invenio - - PGPOOL_SR_CHECK_PASSWORD=dbpass123 + - PGPOOL_PARAMS_BACKEND_HOSTNAME0=postgresql + - PGPOOL_PARAMS_BACKEND_PORT0=5432 + - PGPOOL_PARAMS_BACKEND_WEIGHT0=1 + - PGPOOL_PARAMS_SR_CHECK_USER=invenio + - PGPOOL_PARAMS_SR_CHECK_PASSWORD=dbpass123 + - PGPOOL_PARAMS_PORT=5432 - PGPOOL_ENABLE_LDAP=no - PGPOOL_POSTGRES_USERNAME=postgres - PGPOOL_POSTGRES_PASSWORD=dbpass123 @@ -452,4 +455,3 @@ volumes: mongo_data: # letsencrypt_etc: # letsencrypt_html: - diff --git a/docker-compose2.yml b/docker-compose2.yml index baf22a20a4..3868cc5792 100644 --- a/docker-compose2.yml +++ b/docker-compose2.yml @@ -311,11 +311,14 @@ services: pgpool: restart: "always" - image: bitnami/pgpool + image: pgpool/pgpool:4.2.2 environment: - - PGPOOL_BACKEND_NODES=0:postgresql:5432 - - PGPOOL_SR_CHECK_USER=invenio - - PGPOOL_SR_CHECK_PASSWORD=dbpass123 + - PGPOOL_PARAMS_BACKEND_HOSTNAME0=postgresql + - PGPOOL_PARAMS_BACKEND_PORT0=5432 + - PGPOOL_PARAMS_BACKEND_WEIGHT0=1 + - PGPOOL_PARAMS_SR_CHECK_USER=invenio + - PGPOOL_PARAMS_SR_CHECK_PASSWORD=dbpass123 + - PGPOOL_PARAMS_PORT=5432 - PGPOOL_ENABLE_LDAP=no - PGPOOL_POSTGRES_USERNAME=postgres - PGPOOL_POSTGRES_PASSWORD=dbpass123 @@ -452,4 +455,3 @@ volumes: mongo_data: # letsencrypt_etc: # letsencrypt_html: - diff --git a/modules/weko-accounts/weko_accounts/utils.py b/modules/weko-accounts/weko_accounts/utils.py index eae9eab191..7dd2ede02a 100644 --- a/modules/weko-accounts/weko_accounts/utils.py +++ b/modules/weko-accounts/weko_accounts/utils.py @@ -30,7 +30,6 @@ import hashlib from .config import WEKO_API_LIMIT_RATE_DEFAULT -from weko_admin.models import AdminSettings limiter = Limiter( app=None, @@ -111,6 
+110,7 @@ def parse_attributes(): error = False # Get attribute mapping from admin settings + from weko_admin.models import AdminSettings admin_settings = AdminSettings.get('attribute_mapping', dict_to_object=False) for header, attr in current_app.config[ @@ -221,7 +221,7 @@ def decorated_view(*args, **kwargs): def get_sp_info(): """Get Service Provider (SP) information for Shibboleth login. - + Returns: dict: A dictionary containing SP entityID, handlerURL, and return URL. """ @@ -233,7 +233,7 @@ def get_sp_info(): sp_entityID = 'https://' + current_app.config['WEB_HOST_NAME'] + '/shibboleth-sp' if 'SP_ENTITYID' in current_app.config: sp_entityID = current_app.config['SP_ENTITYID'] - + sp_handlerURL = 'https://' + current_app.config['WEB_HOST_NAME'] + '/Shibboleth.sso' if 'SP_HANDLERURL' in current_app.config: sp_handlerURL = current_app.config['SP_HANDLERURL'] diff --git a/modules/weko-deposit/requirements2.txt b/modules/weko-deposit/requirements2.txt index 3c30c7d8a7..f203b6675a 100644 --- a/modules/weko-deposit/requirements2.txt +++ b/modules/weko-deposit/requirements2.txt @@ -287,3 +287,4 @@ xmlschema==0.9.30 xmltodict==0.12.0 zipp==3.6.0 zope.interface==5.5.2 +pypdfium2==4.30.0 diff --git a/modules/weko-deposit/tests/data/test_files/sample_word.docx b/modules/weko-deposit/tests/data/test_files/sample_word.docx new file mode 100644 index 0000000000..6de626ae06 Binary files /dev/null and b/modules/weko-deposit/tests/data/test_files/sample_word.docx differ diff --git a/modules/weko-deposit/tests/test_utils.py b/modules/weko-deposit/tests/test_utils.py index a48feffb22..2b017a018e 100644 --- a/modules/weko-deposit/tests/test_utils.py +++ b/modules/weko-deposit/tests/test_utils.py @@ -19,12 +19,14 @@ # MA 02111-1307, USA. 
from weko_deposit.api import WekoDeposit -from weko_deposit.utils import update_pdf_contents_es +from weko_deposit.utils import update_pdf_contents_es, extract_text_from_pdf, extract_text_with_tika from mock import patch +from mock import MagicMock import uuid from tests.helpers import create_record_with_pdf - +import os +import pytest # .tox/c1/bin/pytest --cov=weko_deposit tests/test_utils.py::test_update_pdf_contents_es -vv -s --cov-branch --cov-report=term --basetemp=/code/modules/weko-deposit/.tox/c1/tmp def test_update_pdf_contents_es(app, db, location, mocker): @@ -46,4 +48,57 @@ def test_update_pdf_contents_es(app, db, location, mocker): for args, _ in args_list: test = pdf_file_infos[i] assert args[0] == (test,str(record_ids[i])) - i+=1 \ No newline at end of file + i+=1 + + +# .tox/c1/bin/pytest --cov=weko_deposit tests/test_utils.py::test_extract_text_from_pdf -vv -s --cov-branch --cov-report=term --basetemp=/code/modules/weko-deposit/.tox/c1/tmp +def test_extract_text_from_pdf(): + filepath = os.path.join(os.path.dirname(__file__),"data","test_files","test_file_1.2M.pdf") + + # file size > max_size + data = extract_text_from_pdf(filepath, 10000) + assert len(data.encode('utf-8')) <= 10000 + assert data.count("test file page") < 1240 + + # file size <= max_size + data = extract_text_from_pdf(filepath, 100000000) + assert len(data.encode('utf-8')) == 19561 + assert data.count("test file page") == 1240 + + # not exist file + filepath = "not_exist_file.pdf" + with pytest.raises(FileNotFoundError) as e: + data = extract_text_from_pdf(filepath, 10000) + assert str(e.value) == "/code/modules/weko-deposit/not_exist_file.pdf" + + +# .tox/c1/bin/pytest --cov=weko_deposit tests/test_utils.py::test_extract_text_with_tika -vv -s --cov-branch --cov-report=term --basetemp=/code/modules/weko-deposit/.tox/c1/tmp +def test_extract_text_with_tika(): + filepath = os.path.join(os.path.dirname(__file__),"data","test_files","sample_word.docx") + # not exist tika jar file. 
+ mock_env_not_exist_tika = {"TIKA_JAR_FILE_PATH": "/not/exist/path/tika-server.jar"} + with patch.dict(os.environ, mock_env_not_exist_tika, clear=False): + with pytest.raises(Exception) as e: + data = extract_text_with_tika(filepath, 100) + assert str(e.value) == "not exist tika jar file." + + mock_env_not_exist_tika = {"TIKA_JAR_FILE_PATH": "/code/tika/tika-app-2.6.0.jar"} + with patch.dict(os.environ, mock_env_not_exist_tika, clear=False): + # error with subprocess + mock_run = MagicMock() + mock_run.returncode.return_value=1 + mock_run.stderr.decode.return_value="test_error" + with patch("weko_deposit.utils.subprocess.run", return_value=mock_run): + with pytest.raises(Exception) as e: + data = extract_text_with_tika(filepath, 100) + assert str(e.value) == "raise in tika: test_error" + + # file size > max_size + data = extract_text_with_tika(filepath, 50) + assert len(data.encode('utf-8')) < 50 + assert data == "これはテスト用のサンプルwordファイ" + + # file size <= max_size + data = extract_text_with_tika(filepath, 5000) + assert len(data.encode('utf-8')) > 50 + assert data == "これはテスト用のサンプルwordファイルです中身は特に意味がありません" diff --git a/modules/weko-deposit/weko_deposit/utils.py b/modules/weko-deposit/weko_deposit/utils.py index a47761dd9e..0c7cd5a1d1 100644 --- a/modules/weko-deposit/weko_deposit/utils.py +++ b/modules/weko-deposit/weko_deposit/utils.py @@ -20,6 +20,10 @@ from .tasks import extract_pdf_and_update_file_contents from .api import WekoDeposit +import pypdfium2 +import os +import subprocess + def update_pdf_contents_es(record_ids): """register the contents of the record PDF file in elasticsearch @@ -29,4 +33,73 @@ def update_pdf_contents_es(record_ids): deposits = WekoDeposit.get_records(record_ids) for dep in deposits: file_infos = dep.get_pdf_info() - extract_pdf_and_update_file_contents.apply_async((file_infos, str(dep.id))) \ No newline at end of file + extract_pdf_and_update_file_contents.apply_async((file_infos, str(dep.id))) + + +def extract_text_from_pdf(filepath, 
max_size): + """Read PDF file and extract text. + + Args: + filepath (str): Path to the PDF file. + max_size (int): Maximum size of the extracted text in bytes. + + Returns: + str: Extracted text from the PDF file. + + """ + reader = None + data = "" + try: + reader = pypdfium2.PdfDocument(filepath) + texts = [] + total_bytes = 0 + for page in reader: + text = page.get_textpage().get_text_range() + encoded = text.encode('utf-8', errors='replace') + if total_bytes + len(encoded) > max_size: + remain = max_size - total_bytes + texts.append(encoded[:remain].decode('utf-8', errors='ignore')) + break + else: + texts.append(text) + total_bytes += len(encoded) + data = "".join(texts) + data = "".join(data.splitlines()) + finally: + if reader is not None: + reader.close() + + return data + + +def extract_text_with_tika(filepath, max_size): + """Read non-PDF file and extract text. + + Args: + filepath (str): Path to the non-PDF file. + max_size (int): Maximum size of the extracted text in bytes. + + Raises: + Exception: If Tika jar file does not exist. + Exception: If Tika processing fails. + + Returns: + str: Extracted text from the non-PDF file.
+ """ + tika_jar_path = os.environ.get("TIKA_JAR_FILE_PATH") + if not tika_jar_path or os.path.isfile(tika_jar_path) is False: + raise Exception("not exist tika jar file.") + args = ["java", "-jar", tika_jar_path, "-t", filepath] + result = subprocess.run( + args, + stdout=subprocess.PIPE, + stderr=subprocess.PIPE, + ) + if result.returncode != 0: + raise Exception("raise in tika: {}".format(result.stderr.decode("utf-8"))) + data = "".join(result.stdout.decode("utf-8").splitlines()) + if len(data.encode('utf-8')) > max_size: + encoded = data.encode('utf-8') + data = encoded[:max_size].decode('utf-8', errors='ignore') + + return data diff --git a/modules/weko-records-ui/weko_records_ui/templates/weko_records_ui/output_detail_data.html b/modules/weko-records-ui/weko_records_ui/templates/weko_records_ui/output_detail_data.html index 0c5c412a5c..b1c7ed794b 100644 --- a/modules/weko-records-ui/weko_records_ui/templates/weko_records_ui/output_detail_data.html +++ b/modules/weko-records-ui/weko_records_ui/templates/weko_records_ui/output_detail_data.html @@ -72,7 +72,7 @@ {%- endfor -%} {%- else -%} {{ output_attribute_value_mlt_Init( record_detail_data ) }} - {%- endif -%} + {%- endif -%} {%- endif -%} {% endmacro %} @@ -83,7 +83,7 @@ {% if parrent_name %} {%- set labels = parrent_name.split('.') -%} {%- if labels|length == 1 -%} - {{ child_data(parrent_name, '', level) }} + {{ child_data(parrent_name, ' ', level) }} {%- else -%} {%- set displayflag = False -%} {%- endif -%} @@ -118,7 +118,7 @@ {{ content | escape_str }} {%- elif content|url_to_link -%} {{ content | escape_str }} - {%- else -%} + {%- else -%} {{ content | escape_str }} {%- endif -%} {% endautoescape %} @@ -207,7 +207,7 @@ {%- set nsflg.dispflg = True -%} {%- endif -%} {%- endfor -%} - {%- endif -%} + {%- endif -%} {%- endif -%} {%- endfor -%} {%- for language_value in language_data -%} @@ -245,7 +245,7 @@ {%- if value is string -%} {%- if attribute_data|length == 2 -%} {{ 
output_attribute_value_mlt(attribute_data, level) }} - {%- else -%} + {%- else -%} {{ output_attribute_value_mlt_exceptlang(attribute_data,level) }} {%- endif -%} {%- else -%} diff --git a/modules/weko-search-ui/requirements2.txt b/modules/weko-search-ui/requirements2.txt index 3c30c7d8a7..f203b6675a 100644 --- a/modules/weko-search-ui/requirements2.txt +++ b/modules/weko-search-ui/requirements2.txt @@ -287,3 +287,4 @@ xmlschema==0.9.30 xmltodict==0.12.0 zipp==3.6.0 zope.interface==5.5.2 +pypdfium2==4.30.0 diff --git a/modules/weko-search-ui/tests/conftest.py b/modules/weko-search-ui/tests/conftest.py index 9c9c58582c..03f0156a8f 100644 --- a/modules/weko-search-ui/tests/conftest.py +++ b/modules/weko-search-ui/tests/conftest.py @@ -136,7 +136,13 @@ from weko_deposit.api import WekoDeposit from weko_deposit.api import WekoDeposit as aWekoDeposit from weko_deposit.api import WekoIndexer, WekoRecord -from weko_deposit.config import WEKO_BUCKET_QUOTA_SIZE, WEKO_MAX_FILE_SIZE +from weko_deposit.config import ( + WEKO_BUCKET_QUOTA_SIZE, + WEKO_MAX_FILE_SIZE, + WEKO_DEPOSIT_FILESIZE_LIMIT, + WEKO_MIMETYPE_WHITELIST_FOR_ES, + WEKO_DEPOSIT_TEXTMIMETYPE_WHITELIST_FOR_ES +) from weko_groups import WekoGroups from weko_index_tree import WekoIndexTree, WekoIndexTreeREST from weko_index_tree.api import Indexes @@ -694,7 +700,10 @@ def base_app(instance_path, search_class, request): WEKO_ITEMS_UI_INDEX_PATH_SPLIT = '///', WEKO_SEARCH_UI_BULK_EXPORT_RETRY = 5, WEKO_SEARCH_UI_BULK_EXPORT_LIMIT = 100, - RECORDS_UI_ENDPOINTS = RECORDS_UI_ENDPOINTS + RECORDS_UI_ENDPOINTS = RECORDS_UI_ENDPOINTS, + WEKO_DEPOSIT_FILESIZE_LIMIT = WEKO_DEPOSIT_FILESIZE_LIMIT, + WEKO_MIMETYPE_WHITELIST_FOR_ES = WEKO_MIMETYPE_WHITELIST_FOR_ES, + WEKO_DEPOSIT_TEXTMIMETYPE_WHITELIST_FOR_ES = WEKO_DEPOSIT_TEXTMIMETYPE_WHITELIST_FOR_ES ) app_.url_map.converters["pid"] = PIDConverter app_.config["RECORDS_REST_ENDPOINTS"]["recid"]["search_class"] = search_class diff --git 
a/modules/weko-search-ui/tests/data/ams/broken_word.docx b/modules/weko-search-ui/tests/data/ams/broken_word.docx new file mode 100644 index 0000000000..3fa5f4e582 Binary files /dev/null and b/modules/weko-search-ui/tests/data/ams/broken_word.docx differ diff --git a/modules/weko-search-ui/tests/data/ams/png_file.pdf b/modules/weko-search-ui/tests/data/ams/png_file.pdf new file mode 100644 index 0000000000..cc8d7bda54 Binary files /dev/null and b/modules/weko-search-ui/tests/data/ams/png_file.pdf differ diff --git a/modules/weko-search-ui/tests/data/ams/png_file.txt b/modules/weko-search-ui/tests/data/ams/png_file.txt new file mode 100644 index 0000000000..cc8d7bda54 Binary files /dev/null and b/modules/weko-search-ui/tests/data/ams/png_file.txt differ diff --git a/modules/weko-search-ui/tests/data/ams/sample.txt b/modules/weko-search-ui/tests/data/ams/sample.txt new file mode 100644 index 0000000000..990383c64b --- /dev/null +++ b/modules/weko-search-ui/tests/data/ams/sample.txt @@ -0,0 +1,2 @@ +This is a +text file. diff --git a/modules/weko-search-ui/tests/data/ams/with_two_extended_metadata.json b/modules/weko-search-ui/tests/data/ams/with_two_extended_metadata.json new file mode 100644 index 0000000000..eb70def6c2 --- /dev/null +++ b/modules/weko-search-ui/tests/data/ams/with_two_extended_metadata.json @@ -0,0 +1,99 @@ +{ + "@id": "./", + "@type": "Dataset", + "datePublished": "2025-10-22", + "name": "extract", + "description": "Item metadata for Item ID: 2000036. 
Title: extract.", + "wk:index": [ + "1623632832836" + ], + "wk:publishStatus": "public", + "wk:feedbackMail": [], + "wk:requestMail": [], + "wk:grant": [], + "wk:editMode": "Keep", + "dc:title": [ + { + "@id": "#:title_0", + "@type": "PropertyValue", + "value": "extract", + "language": "ja" + } + ], + "dc:type": { + "@id": "#:type_1", + "@type": "PropertyValue", + "rdf:resource": "departmental bulletin paper", + "value": "http://purl.org/coar/resource_type/c_6501" + }, + "hasPart": [ + { + "@id": "data/guide.pdf", + "@type": "File", + "dcterms:accessRights": "open_access", + "datePublished": "2025-10-22", + "name": "guide.pdf", + "jpcoar:extent": [ + { + "@id": "#:extent_3", + "@type": "File", + "value": "844 KB" + } + ], + "jpcoar:mimeType": "application/pdf", + "jpcoar:URI": { + "@id": "#:URI_4", + "@type": "URL", + "value": "https://192.168.56.102/record/2000036/files/guide.pdf" + }, + "wk:textExtraction": true, + "wk:extendedMetadata": true + }, + { + "@id": "data/sample.txt", + "@type": "File", + "dcterms:accessRights": "open_access", + "datePublished": "2025-10-22", + "name": "sample.txt", + "jpcoar:extent": [ + { + "@id": "#:extent_6", + "@type": "File", + "value": "51 B" + } + ], + "jpcoar:mimeType": "text/plain", + "jpcoar:URI": { + "@id": "#:URI_7", + "@type": "URL", + "value": "https://192.168.56.102/record/2000036/files/sample.txt" + }, + "wk:textExtraction": true, + "wk:extendedMetadata": true + }, + { + "@id": "data/pp.pptx", + "@type": "File", + "dcterms:accessRights": "open_access", + "datePublished": "2025-10-22", + "name": "pp.pptx", + "jpcoar:extent": [ + { + "@id": "#:extent_9", + "@type": "File", + "value": "432 KB" + } + ], + "jpcoar:mimeType": "application/vnd.openxmlformats-officedocument.presentationml.presentation", + "jpcoar:URI": { + "@id": "#:URI_10", + "@type": "URL", + "value": "https://192.168.56.102/record/2000036/files/pp.pptx" + }, + "wk:textExtraction": true, + "wk:extendedMetadata": false + } + ], + "wk:itemLinks": [], + 
"wk:metadataAutoFill": false +} diff --git a/modules/weko-search-ui/tests/data/ams/without_hasPart.json b/modules/weko-search-ui/tests/data/ams/without_hasPart.json new file mode 100644 index 0000000000..a4a18e1ba1 --- /dev/null +++ b/modules/weko-search-ui/tests/data/ams/without_hasPart.json @@ -0,0 +1,31 @@ +{ + "@id": "./", + "@type": "Dataset", + "datePublished": "2025-10-22", + "name": "extract", + "description": "Item metadata for Item ID: 2000036. Title: extract.", + "wk:index": [ + "1623632832836" + ], + "wk:publishStatus": "public", + "wk:feedbackMail": [], + "wk:requestMail": [], + "wk:grant": [], + "wk:editMode": "Keep", + "dc:title": [ + { + "@id": "#:title_0", + "@type": "PropertyValue", + "value": "extract", + "language": "ja" + } + ], + "dc:type": { + "@id": "#:type_1", + "@type": "PropertyValue", + "rdf:resource": "departmental bulletin paper", + "value": "http://purl.org/coar/resource_type/c_6501" + }, + "wk:itemLinks": [], + "wk:metadataAutoFill": false +} diff --git "a/modules/weko-search-ui/tests/data/ams/\343\202\265\343\203\263\343\203\227\343\203\2532.txt" "b/modules/weko-search-ui/tests/data/ams/\343\202\265\343\203\263\343\203\227\343\203\2532.txt" new file mode 100644 index 0000000000..793629ceea --- /dev/null +++ "b/modules/weko-search-ui/tests/data/ams/\343\202\265\343\203\263\343\203\227\343\203\2532.txt" @@ -0,0 +1 @@ +上限:8バイト diff --git a/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata.json b/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata.json index 4cf2aec9d1..6783aa33ac 100644 --- a/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata.json +++ b/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata.json @@ -90,13 +90,13 @@ ], "hasPart": [ { - "@id": "data/sample.txt" + "@id": "sample.txt" }, { - "@id": "data/data.csv" + "@id": "data.csv" }, { - "@id": "data/0606/data.csv" + "@id": "0606/data.csv" }, { "@id": "https://example.com/test/sample/1" @@ -447,7 +447,7 @@ "value": "Example Organization" }, { 
- "@id": "data/data.csv", + "@id": "data.csv", "@type": "File", "dcterms:accessRights": "open_login", "datePublished": "2025-06-06", @@ -469,7 +469,7 @@ "wk:textExtraction": false }, { - "@id": "data/0606/data.csv", + "@id": "0606/data.csv", "@type": "File", "dcterms:accessRights": "open_login", "datePublished": "2025-06-06", @@ -491,7 +491,7 @@ "wk:textExtraction": true }, { - "@id": "data/sample.txt", + "@id": "sample.txt", "@type": "File", "dcterms:accessRights": "open_access", "datePublished": "2025-06-06", diff --git a/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata2.json b/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata2.json index 813a3e6155..14ecf082e1 100644 --- a/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata2.json +++ b/modules/weko-search-ui/tests/data/jsonld/ro-crate-metadata2.json @@ -72,7 +72,7 @@ ], "hasPart": [ { - "@id": "data/sample.rst" + "@id": "sample.rst" } ], "hasPolicy": [ @@ -155,7 +155,7 @@ ], "hasPart": [ { - "@id": "data/data.csv" + "@id": "data.csv" } ], "hasPolicy": [ @@ -344,7 +344,7 @@ "jpcoar:identifierRegistration": "DataCite" }, { - "@id": "data/sample.rst", + "@id": "sample.rst", "@type": "File", "name": "sample.rst", "contentSize": "333", @@ -360,7 +360,7 @@ "wk:accessMode": "open_access" }, { - "@id": "data/data.csv", + "@id": "data.csv", "@type": "File", "name": "data.csv", "contentSize": "1234", diff --git a/modules/weko-search-ui/tests/test_mapper.py b/modules/weko-search-ui/tests/test_mapper.py index 0392cb4f55..ce4510661f 100644 --- a/modules/weko-search-ui/tests/test_mapper.py +++ b/modules/weko-search-ui/tests/test_mapper.py @@ -1,10 +1,13 @@ +import json import pytest import xmltodict import uuid +import json from datetime import date from mock import patch from unittest.mock import MagicMock from collections import OrderedDict +from pypdfium2 import PdfiumError from weko_records.api import Mapping from weko_records.models import ItemType,ItemTypeName @@ -4717,6 +4720,7 @@ def 
test_to_item_metadata(self, app, db, item_type2, item_type_mapping2): assert system_info["cnri"] == "1234/5678" assert system_info["doi_ra"] == "DataCite" assert system_info["doi"] == "10.1234/5678" + assert system_info["file_path"] == ["sample.txt", "data.csv", "0606/data.csv", ""] assert system_info["non_extract"] == ["data.csv"] assert system_info["save_as_is"] == False assert system_info["amend_doi"] == "10.2964/jsik_2021_067" @@ -4757,14 +4761,53 @@ def test_to_item_metadata(self, app, db, item_type2, item_type_mapping2): assert list_record[0].get("errors") is None + schema["properties"].update({ + "item_1754636750964": { + "type": "string", + "title": "Extra", + "format": "textarea" + } + }) + item_type2.model.schema = schema + db.session.commit() + json_ld["@graph"][0].update({ + "additional": { "@id": "#additional" } + }) + json_ld["@graph"].append({ + "@id": "#additional", + "value": "This is an extra field for testing." + }) + with app.test_request_context(): + mapper = JsonLdMapper(item_type2.model.id, json_mapping) + item_metadatas, format = mapper.to_item_metadata(json_ld) + item_metadata, system_info = item_metadatas[0] + assert isinstance(item_metadata["item_1754636750964"], str) + assert isinstance(json.loads(item_metadata["item_1754636750964"]), dict) + + schema = json_data("data/jsonld/item_type_schema.json") schema = json_data("data/jsonld/item_type_schema.json") + schema["properties"].update({ + "item_1744171568909": { + "type": "array", + "items": { + "type": "object", + "properties": { + "interim": { + "type": "string" + } + } + }, + "title": "Extra", + "maxItems": 9999, + "minItems": 1 + } + }) item_type2.model.schema = schema mapping = json_data("data/jsonld/item_type_mapping.json") item_type_mapping2.model.mapping = mapping db.session.commit() json_mapping = json_data("data/jsonld/ro-crate_mapping.json") json_ld = json_data("data/jsonld/ro-crate-metadata2.json") - with app.test_request_context(): mapper = JsonLdMapper(item_type2.model.id, 
json_mapping) item_metadatas, format = mapper.to_item_metadata(json_ld) @@ -4776,21 +4819,25 @@ def test_to_item_metadata(self, app, db, item_type2, item_type_mapping2): assert system_info["_id"] == "_:JournalPaper1" assert system_info["link_data"][0]["item_id"] == "_:EvidenceData1" assert system_info["link_data"][0]["sele_id"] == "isSupplementedBy" + assert system_info["file_path"] == ["sample.rst"] assert thesis["pubdate"] == "2021-10-15" assert thesis["path"] == [1623632832836] assert thesis["item_30001_title0"][0]["subitem_title"] == "The Sample Dataset for WEKO" assert thesis["item_30001_title0"][1]["subitem_title"] == "WEKO用サンプルデータセット" assert thesis["files_info"][0]["key"] == "item_30001_file22" + assert thesis["item_1744171568909"][0]["interim"] evidence, system_info = item_metadatas[1] assert system_info["_id"] == "_:EvidenceData1" assert system_info["link_data"][0]["item_id"] == "_:JournalPaper1" assert system_info["link_data"][0]["sele_id"] == "isSupplementTo" + assert system_info["file_path"] == ["data.csv"] assert system_info["non_extract"] == ["data.csv"] assert evidence["pubdate"] == "2021-10-15" assert evidence["path"] == [1623632832836] assert evidence["item_30001_title0"][0]["subitem_title"] == "The Sample Dataset for WEKO, evidence part" assert evidence["item_30001_title0"][1]["subitem_title"] == "WEKO用サンプルデータセットのエビデンス部分" + assert evidence["item_1744171568909"][0]["interim"] list_record = [ { @@ -4808,16 +4855,18 @@ def test_to_item_metadata(self, app, db, item_type2, item_type_mapping2): # def deconstruct_json_ld(json_ld): # .tox/c1/bin/pytest --cov=weko_search_ui tests/test_mapper.py::TestJsonLdMapper::test__deconstruct_json_ld -v -vv -s --cov-branch --cov-report=xml --basetemp=/code/modules/weko-search-ui/.tox/c1/tmp - def test__deconstruct_json_ld(self, app): + def test__deconstruct_json_ld(self, app, item_type2): json_ld = json_data("data/jsonld/ro-crate-metadata.json") - deconstructed_metadata, format = 
JsonLdMapper._deconstruct_json_ld(json_ld) + mapper = JsonLdMapper(item_type2.model.id, None) + deconstructed_metadata, format = mapper._deconstruct_json_ld(json_ld) metadata, system_info = deconstructed_metadata[0] assert format == "ro-crate" assert system_info["cnri"] == "1234/5678" assert system_info["doi_ra"] == "DataCite" assert system_info["doi"] == "10.1234/5678" - assert system_info["non_extract"] == ["data/data.csv"] + assert system_info["file_path"] == ["sample.txt", "data.csv", "0606/data.csv", "https://example.com/test/sample/1"] + assert system_info["non_extract"] == ["data.csv"] assert system_info["save_as_is"] == False assert metadata["@id"] == "./" assert metadata["name"] == "The Sample Dataset for WEKO" @@ -4829,15 +4878,16 @@ def test__deconstruct_json_ld(self, app): assert metadata["dc:title[1].language"] == "ja" assert metadata["dc:type.rdf:resource"] == "http://purl.org/coar/resource_type/c_ddb1" assert metadata["dc:type.value"] == "dataset" - assert metadata["hasPart[0].@id"] == "data/sample.txt" + assert metadata["hasPart[0].@id"] == "sample.txt" assert metadata["hasPart[0].name"] == "sample.txt" - assert metadata["hasPart[1].@id"] == "data/data.csv" + assert metadata["hasPart[1].@id"] == "data.csv" assert metadata["hasPart[1].name"] == "data.csv" assert metadata["dcterms:accessRights.value"] == "embargoed access" assert not any("@type" in key for key in metadata.keys()) json_ld = json_data("data/jsonld/ro-crate-metadata2.json") - deconstructed_metadata, format = JsonLdMapper._deconstruct_json_ld(json_ld) + mapper = JsonLdMapper(item_type2.model.id, None) + deconstructed_metadata, format = mapper._deconstruct_json_ld(json_ld) thesis, system_info = deconstructed_metadata[0] assert format == "ro-crate" @@ -4846,6 +4896,7 @@ def test__deconstruct_json_ld(self, app): assert system_info["link_data"][0]["sele_id"] == "isSupplementedBy" assert system_info["link_data"][1]["item_id"] == "https://example.repo.nii.ac.jp/records/123456789" assert 
system_info["link_data"][1]["sele_id"] == "isSupplementedBy" + assert system_info["file_path"] == ["sample.rst"] assert thesis["@id"] == "_:JournalPaper1" assert thesis["dc:title[0].value"] == "The Sample Dataset for WEKO" assert thesis["dc:title[1].value"] == "WEKO用サンプルデータセット" @@ -4857,7 +4908,8 @@ def test__deconstruct_json_ld(self, app): assert system_info["_id"] == "_:EvidenceData1" assert system_info["link_data"][0]["item_id"] == "_:JournalPaper1" assert system_info["link_data"][0]["sele_id"] == "isSupplementTo" - assert system_info["non_extract"] == ["data/data.csv"] + assert system_info["file_path"] == ["data.csv"] + assert system_info["non_extract"] == ["data.csv"] assert evidence["@id"] == "_:EvidenceData1" assert evidence["dc:title[0].value"] == "The Sample Dataset for WEKO, evidence part" assert evidence["dc:title[1].value"] == "WEKO用サンプルデータセットのエビデンス部分" @@ -4865,7 +4917,8 @@ def test__deconstruct_json_ld(self, app): assert evidence["dc:type.@id"] == "http://purl.org/coar/resource_type/c_1843" with pytest.raises(ValueError) as ex: - deconstructed_metadata, format = JsonLdMapper._deconstruct_json_ld({}) + mapper = JsonLdMapper(item_type2.model.id, None) + deconstructed_metadata, format = mapper._deconstruct_json_ld({}) ex.match('Invalid json-ld format: "@context" is invalid.') # def to_rocrate_metadata(self, metadata): @@ -4929,10 +4982,10 @@ def test_to_rocrate_metadata(self, app, db, item_type2, item_type_mapping2, mock haspart_1 = graph["hasPart"][1]["@id"] file_1 = rocrate.dereference(haspart_1) - assert haspart_0 == "data/sample.txt" + assert haspart_0 == "sample.txt" assert file_0["name"] == "sample.txt" assert rocrate.dereference(file_0["jpcoar:URI"]["@id"])["value"] == "https://localhost/record/2000001/files/sample.txt" - assert haspart_1 == "data/data.csv" + assert haspart_1 == "data.csv" assert file_1["name"] == "data.csv" assert rocrate.dereference(file_1["jpcoar:URI"]["@id"])["value"] == "https://localhost/record/2000001/files/data.csv" @@ 
-5240,3 +5293,102 @@ def test_to_item_metadata_ams_dict(self, app, db, item_type2): assert item_metadata["item_1736145554459"]["subitem_date_issued_datetime"] == "2025-06-11" assert item_metadata["item_1749689698804"]["subitem_relation_type_id"]["subitem_relation_type_id_text"] == "grdm" assert item_metadata["item_1749689698804"]["subitem_relation_type"] == "isVersionOf" + + + # def extract_extended_metadata(self, list_extracted): + # .tox/c1/bin/pytest --cov=weko_search_ui tests/test_mapper.py::TestJsonLdMapper::test_extract_extended_metadata -v -vv -s --cov-branch --cov-report=html --basetemp=/code/modules/weko-search-ui/.tox/c1/tmp + def test_extract_extended_metadata(self, app, db, item_type2, mocker): + mapper = JsonLdMapper(item_type2.model.id, None) + values = ["first", "second"] + mocker.patch.object(mapper, "extract_text_from_files", + side_effect = values) + + rocrate = json_data("data/ams/with_two_extended_metadata.json") + rocrate = mapper.extract_extended_metadata([rocrate])[0] + + ids = [part["@id"] + for part in rocrate.get("hasPart", []) + if "@id" in part] + assert ids == ["data/pp.pptx"] + + ext = rocrate["extended_metadata"]["value"] + ext = json.loads(ext) + + assert len(ext) == 2 + assert ext["data/sample.txt"] == "first" + assert ext["data/guide.pdf"] == "second" + + # without hasPart + rocrate = json_data("data/ams/without_hasPart.json") + rocrate = mapper.extract_extended_metadata([rocrate])[0] + assert "extended_metadata" not in rocrate + + # def extract_text_from_files(self, filename): + # .tox/c1/bin/pytest --cov=weko_search_ui tests/test_mapper.py::TestJsonLdMapper::test_extract_text_from_files -v -vv -s --cov-branch --cov-report=html --basetemp=/code/modules/weko-search-ui/.tox/c1/tmp + def test_extract_text_from_files(self, app, db, item_type2, mocker, tmp_path): + mapper = JsonLdMapper(item_type2.model.id, None) + + mapper.data_path = str(tmp_path) + file_content = "これは\r\nテキストファイルです\r\n" + + file_name = "サンプル.txt" + tmpfile = 
tmp_path / file_name + tmpfile.write_text(file_content, encoding="shift_jis") + extract_text = mapper.extract_text_from_files(file_name) + assert extract_text == file_content + + file_name = "サンプル.TXT" + tmpfile = tmp_path / file_name + tmpfile.write_text(file_content, encoding="utf-8") + extract_text = mapper.extract_text_from_files(file_name) + assert extract_text == file_content + + file_name = "サンプル.txt" + tmpfile = tmp_path / file_name + tmpfile.write_text(file_content, encoding="utf-8") + extract_text = mapper.extract_text_from_files(file_name) + assert extract_text == "" + + mapper.data_path = "tests/data/ams" + + app.config.update({"WEKO_DEPOSIT_FILESIZE_LIMIT": 8}) + extract_text = mapper.extract_text_from_files("sample.txt") + assert extract_text == "This is " + + app.config.update({"WEKO_DEPOSIT_FILESIZE_LIMIT": 8}) + extract_text = mapper.extract_text_from_files("サンプル2.txt") + assert extract_text == "上限:8" + + app.config.update({"WEKO_DEPOSIT_FILESIZE_LIMIT": 2 * 1024 * 1024}) + extract_text = mapper.extract_text_from_files("sample.txt") + assert extract_text == "This is a\ntext file.\n" + + with pytest.raises(ValueError) as e: + extract_text = mapper.extract_text_from_files("png_file.txt") + assert str(e.value) == "Failed to load text file: png_file.txt" + + with pytest.raises(PdfiumError) as e: + extract_text = mapper.extract_text_from_files("png_file.pdf") + assert str(e.value) == "Failed to load PDF file: png_file.pdf" + + with pytest.raises(ValueError) as e: + extract_text = mapper.extract_text_from_files("broken_word.docx") + assert str(e.value) == "Failed to load document: broken_word.docx" + + with pytest.raises(FileNotFoundError) as e: + extract_text = mapper.extract_text_from_files("not_exist.txt") + assert str(e.value) == "File Not Found: not_exist.txt" + + mocker.patch("weko_search_ui.mapper.extract_text_from_pdf", + return_value="This is a pdf file.") + mocker.patch("os.path.isfile", return_value=True) + extract_text = 
mapper.extract_text_from_files("pdffile.pdf") + assert extract_text == "This is a pdf file." + + mocker.patch("weko_search_ui.mapper.extract_text_with_tika", + return_value="This is a pptx file.") + extract_text = mapper.extract_text_from_files("powerpoint.pptx") + assert extract_text == "This is a pptx file." + + extract_text = mapper.extract_text_from_files("sample.other") + assert extract_text == "" diff --git a/modules/weko-search-ui/tests/test_utils.py b/modules/weko-search-ui/tests/test_utils.py index cfec92af9f..ec5cb95c46 100644 --- a/modules/weko-search-ui/tests/test_utils.py +++ b/modules/weko-search-ui/tests/test_utils.py @@ -930,7 +930,8 @@ def test_handle_convert_validate_msg_to_jp(i18n_app): # def handle_validate_item_import(list_record, schema) -> list: -def test_handle_validate_item_import(app, mocker_itemtype): +# .tox/c1/bin/pytest --cov=weko_search_ui tests/test_utils.py::test_handle_validate_item_import -vv -s --cov-branch --cov-report=term --basetemp=/code/modules/weko-search-ui/.tox/c1/tmp +def test_handle_validate_item_import(app, mocker_itemtype, mocker): filepath = os.path.join( os.path.dirname(os.path.realpath(__file__)), "data", "csv", "data.json" ) @@ -964,6 +965,96 @@ def test_handle_validate_item_import(app, mocker_itemtype): == result ) + schema = { + "type": "object", + "properties": { + "item_xxx": { + "type": "object", + "properties": { + "subitem_yyy": { + "type": "array", + "items": { + "type": "object", + "properties": { + "subitem_zzz": { + "type": "string", + } + } + } + } + } + } + } + } + + list_record = [ + { + "metadata": { + 'item_xxx': { + 'subitem_yyy':[ + {"subitem_zzz": 123} + ] + } + } + } + ] + with app.test_request_context(): + with set_locale("en"): + result = handle_validate_item_import(list_record, schema) + warnings = result[0].get("warnings", []) + target = list_record[0]["metadata"]['item_xxx']['subitem_yyy'][0]["subitem_zzz"] + assert any("Replace value of" in w for w in warnings) + assert any("is different 
from existing" in w for w in warnings) + assert type(target) == str + + list_record[0]["metadata"]['item_xxx']['subitem_yyy'][0]["subitem_zzz"] = 456 + + with app.test_request_context(): + with set_locale("ja"): + result = handle_validate_item_import(list_record, schema) + warnings = result[0].get("warnings", []) + assert any("へ置き換えました。" in w for w in warnings) + assert any("と異なっています。" in w for w in warnings) + + schema = { + "type": "object", + "properties": { + "item_aaa": { + "type": "object", + "properties": { + "subitem_bbb": { + "type": "object", + "properties": { + "subitem_ccc": { + "enum": [None, "Yes|Yes", "No|No"], + } + } + } + } + } + } + } + + list_record = [ + { + "metadata": { + 'item_aaa': { + 'subitem_bbb': { + "subitem_ccc": "Yes" + } + } + } + } + ] + with app.test_request_context(): + with set_locale("en"): + result = handle_validate_item_import(list_record, schema) + assert "errors" in result[0] + + with app.test_request_context(): + with set_locale("ja"): + result = handle_validate_item_import(list_record, schema) + assert "errors" in result[0] # def represents_int(s): def test_represents_int(): diff --git a/modules/weko-search-ui/weko_search_ui/mapper.py b/modules/weko-search-ui/weko_search_ui/mapper.py index 9ebeb7d102..89a6578c09 100644 --- a/modules/weko-search-ui/weko_search_ui/mapper.py +++ b/modules/weko-search-ui/weko_search_ui/mapper.py @@ -10,6 +10,10 @@ import os import re +import json +import chardet +import mimetypes +from pypdfium2 import PdfiumError import itertools import xmltodict import traceback @@ -18,6 +22,7 @@ from functools import partial, reduce from rocrate.rocrate import ROCrate from rocrate.model.contextentity import ContextEntity +from urllib.parse import urlparse from flask import current_app, url_for @@ -26,6 +31,7 @@ Mapping, ItemTypes, FeedbackMailList, RequestMailList, ItemLink ) from weko_records.serializers.utils import get_full_mapping +from weko_deposit.utils import extract_text_from_pdf, 
extract_text_with_tika from .config import ROCRATE_METADATA_FILE, ROCRATE_METADATA_WK_CONTEXT_V1 @@ -1270,7 +1276,6 @@ def _get_property_type(self, chained_path): Returns: str: property type. e.g. "string", "array", "object" """ - # property_type = "" properties = self.itemtype.schema.get("properties") for p in chained_path.split("."): if properties[p].get("type") == "object": @@ -1449,6 +1454,13 @@ def _map_to_item(self, metadata, system_info): fixed_properties[key] = {} fixed_properties[key][sub_key] = value + def is_url(s: str) -> bool: + try: + result = urlparse(s) + return all([result.scheme, result.netloc]) + except ValueError: + return False + mapped_metadata = {} system_info = { **system_info, @@ -1458,115 +1470,19 @@ def _map_to_item(self, metadata, system_info): **({"uri": system_info["uri"]} if isinstance(system_info.get("uri"), str) else {}), "file_path": [ - filename[5:] for filename in system_info["file_path"] - if filename.startswith("data/") + filename if not is_url(filename) else "" + for filename in system_info["file_path"] ], "non_extract": [ - filename[5:] for filename in system_info["non_extract"] - if filename.startswith("data/") + filename for filename in system_info["non_extract"] + if not is_url(filename) ], + "warnings": [], } missing_metadata = {} - def _empty_metadata(parent_prop_key): - return fixed_properties.get(parent_prop_key, {}) - - def _set_metadata(parent, meta_props, prop_props): - """ - Args: - parent (dict): parent metadata. - meta_props (list[str]): - json-ld hierarchy split by ".". - prop_props (list[str]): - itemtype metadata metadata split by ".". 
- """ - # META_KEY="dc:type.@id", meta_props=["dc:type", "@id"] - # PROP_PATH=item_30001_resource_type11.resourceuri, prop_props=["item_30001_resource_type11","resourceuri"] - if len(prop_props) == 0: - raise Exception("Unexpected error: prop_props is empty.") - if len(prop_props) == 1: - if self._get_property_type(PROP_PATH) == "array": - schema = self.itemtype.schema["properties"] - for prop in PROP_PATH: - schema = schema.get(prop) - schema = schema.get("items").get("properties") - interim = list(schema.keys())[0] - if parent.get(prop_props[0]) is None: - parent[prop_props[0]] = [ - {interim: META_VALUE} - ] - else: - parent[prop_props[0]].append( - {interim: META_VALUE} - ) - else: - parent.update({prop_props[0]: META_VALUE}) - return - - full_props = PROP_PATH.split(".") - parent_prop_key = ".".join( - full_props[:(len(full_props) - len(prop_props) + 1)] - ) - m_index = re.search(r"\[(\d+)\]", meta_props[0]) - index = int(m_index.group(1)) if m_index is not None else None - if ( - not parent_prop_key in properties_mapping.values() - and not len(meta_props) == 1 - ): - # The corresponding layers are different, - # so the prop_path needs to progress to the lower layer. - sub_prop_key = parent_prop_key + "." 
+ prop_props[1] - if self._get_property_type(parent_prop_key) == "object": - sub_prop_object = parent.get( - prop_props[0], _empty_metadata(parent_prop_key) - ) - sub_sub_object = sub_prop_object.get( - prop_props[1], _empty_metadata(sub_prop_key) - ) - _set_metadata( - sub_sub_object, meta_props[1:], prop_props[1:] - ) - sub_prop_object.update({prop_props[1]: sub_sub_object}) - parent.update({prop_props[0]: sub_prop_object}) - elif self._get_property_type(parent_prop_key) == "array": - sub_prop_array = parent.get(prop_props[0], []) - index = 0 if index is None else index - if len(sub_prop_array) <= index: - sub_prop_array.extend([ - _empty_metadata(parent_prop_key) - for _ in range(index - len(sub_prop_array) + 1) - ]) - sub_sub_object = _empty_metadata(sub_prop_key) - _set_metadata(sub_sub_object, meta_props, prop_props[1:] - ) - sub_prop_array[index].update(sub_sub_object) - parent.update({prop_props[0]: sub_prop_array}) - return - if self._get_property_type(parent_prop_key) == "object": - sub_prop_object = parent.get( - prop_props[0], _empty_metadata(parent_prop_key) - ) - if index is not None and index > 1: - return - _set_metadata(sub_prop_object, meta_props[1:], prop_props[1:] - ) - parent.update({prop_props[0]: sub_prop_object}) - - elif self._get_property_type(parent_prop_key) == "array": - sub_prop_array = parent.get(prop_props[0], []) - index = 0 if index is None else index - if len(sub_prop_array) <= index: - sub_prop_array.extend([ - _empty_metadata(parent_prop_key) - for _ in range(index - len(sub_prop_array) + 1) - ]) - _set_metadata( - sub_prop_array[index], meta_props[1:], prop_props[1:] - ) - parent.update({prop_props[0]: sub_prop_array}) - return - + from flask_babelex import gettext as _ for META_KEY, META_VALUE in metadata.items(): if not isinstance(META_KEY, str): continue @@ -1595,8 +1511,14 @@ def _set_metadata(parent, meta_props, prop_props): ) mapped_metadata["request_mail_list"] = request_mail_list elif META_PATH not in 
properties_mapping: - if not META_KEY.endswith("@id"): + if ("wk:" not in META_KEY and not META_KEY.endswith("@id") + and META_KEY not in ["name", "description"]): missing_metadata[META_KEY] = META_VALUE + system_info["warnings"].append(_( + "Cannot map to item type from json-ld; " + "Mapping is not defined for the metadata, " + '"%(key)s": "%(value)s"', key=META_KEY, value=META_VALUE + )) else: # item metadata meta_props = META_KEY.split(".") @@ -1610,11 +1532,28 @@ def _set_metadata(parent, meta_props, prop_props): # META_KEY="dc:type.@id", meta_props=["dc:type","@id"], # PROP_PATH=item_30001_resource_type11.resourceuri, prop_props=["item_30001_resource_type11","resourceuri"] try: - _set_metadata(mapped_metadata, meta_props, prop_props) + adjusted_meta_key = self._align_index(META_KEY, properties_mapping) + valid_path = self._check_settable_path(adjusted_meta_key) + if valid_path: + set_by_jsonpath( + mapped_metadata, valid_path, META_VALUE, fixed_properties=fixed_properties + ) + else: + missing_metadata[META_KEY] = META_VALUE + system_info["warnings"].append(_( + "Cannot map to item type from json-ld; " + "Not found mapping destination for the metadata, " + '"%(key)s": "%(value)s"', key=META_KEY, value=META_VALUE + )) except Exception as ex: current_app.logger.warning( - f"Failed to set metadata for {META_KEY}: {META_VALUE}" + f"Failed to set metadata for '{META_KEY}': '{META_VALUE}'" ) + missing_metadata[META_KEY] = META_VALUE + system_info["warnings"].append(_( + "Failed to set metadata for json-ld, " + '"%(key)s": "%(value)s"', key=META_KEY, value=META_VALUE + )) traceback.print_exc() # Check if "Extra" prepared in itemtype schema form item_map @@ -1626,10 +1565,17 @@ def _set_metadata(parent, meta_props, prop_props): extra_key).get("items").get("properties") interim = list(extra_schema.keys())[0] mapped_metadata[item_map.get("Extra")] = [ - {interim: str(missing_metadata)} + {interim: json.dumps(missing_metadata, ensure_ascii=False)} ] else: - 
mapped_metadata[item_map.get("Extra")] = str(missing_metadata) + mapped_metadata[item_map.get("Extra")] = json.dumps(missing_metadata, ensure_ascii=False) + system_info["warnings"] = [ + _("Metadata which could not be mapped to item type will be set in 'Extra'.") + ] + system_info["warnings"] + elif missing_metadata: + system_info["warnings"] = [ + _("Metadata which could not be mapped to item type will be discarded.") + ] + system_info["warnings"] files_info = [] for v in item_map.values(): @@ -1637,16 +1583,6 @@ def _set_metadata(parent, meta_props, prop_props): continue files_key = v.split(".")[0] - files = mapped_metadata.get(files_key, []) - - # remove "data/" prefix from label - files = [ - file["url"].update({"label": label[5:]}) - for file in files - for label in [file["url"].get("label")] - if label.startswith("data/") - ] - files_info.append({"key": files_key}) mapped_metadata["files_info"] = files_info # mapped_metadata = { @@ -1659,8 +1595,7 @@ def _set_metadata(parent, meta_props, prop_props): # } return mapped_metadata, system_info - @classmethod - def _deconstruct_json_ld(cls, json_ld): + def _deconstruct_json_ld(self, json_ld): """Deconstruct json-ld. Deconstructing json-ld metadata values ​​one by one @@ -1772,10 +1707,11 @@ def _resolve_link(parent, key, value): list_extracted = [ extracted ] else: list_extracted = [ extracted ] + self.extract_extended_metadata(list_extracted) list_deconstructed = [] for extracted in list_extracted: - metadata = cls._deconstruct_dict(extracted) + metadata = self._deconstruct_dict(extracted) system_info = {} system_info.update( {"id": extracted["identifier"]} @@ -1874,6 +1810,171 @@ def _deconstructer(metadata, parent, key, value): return return_data + + def _align_index(self, metadata_key, properties_mapping): + """Map path between json-ld and itemtype metadata. + + Align the indexes of the path and item type path in the json-ld + based on the mapping. + + Args: + metadata_key (str): path in json-ld metadata. 
+ properties_mapping (dict): mapping between json-ld and itemtype metadata. + + Returns: + str|None: Mapped path with index, or None if not found. + """ + # Split meta_key and extract indices + key_parts = re.findall(r'([^\.\[]+)(?:\[(\d+)\])?', metadata_key) # type: list[tuple[str, str]] + key_names = [k for k, _ in key_parts] + key_indices = [idx for _, idx in key_parts] + + # Find the longest matching mapping key + for i in range(len(key_names), 0, -1): + chained = ".".join(key_names[:i]) + if chained in properties_mapping: + mapped = properties_mapping[chained] # type: str + mapped_parts = mapped.split('.') + # meta_key: hasPart[0].dcterms:accessRights + # mapping: hasPart.dcterms:accessRights -> item_30002_file35.accessrole + # → item_30002_file35[0].accessrole + result_parts = [] + for j, part in enumerate(mapped_parts): + idx = key_indices[j] if j < len(key_indices) else None + if idx: + if not re.search(r"\[\d+\]$", part): + part = f"{part}[{idx}]" + result_parts.append(part) + return ".".join(result_parts) + return None + + def _check_settable_path(self, json_path): + """Check if can put value to itemtype property by json path. + + Args: + json_path (str): JSONPath-style string in itemtype property. + + Returns: + str|None: settable json path or None if not settable. 
+ """ + tokens = tokenize_jsonpath(json_path) + settable_path = None + + for element, index, current_path in tokens: + type = self._get_property_type(current_path) + + if type == "array": + if index is not None: + if settable_path: + settable_path += f".{element}[{index}]" + else: + settable_path = f"{element}[{index}]" + else: + if settable_path: + settable_path += f".{element}[0]" + else: + settable_path = f"{element}[0]" + else: + if index is not None and index > 0: + settable_path = None + break + else: + if settable_path: + settable_path += f".{element}" + else: + settable_path = f"{element}" + + if settable_path and re.search(r'\[\d+\]$', settable_path): + return None + + return settable_path + + + def extract_extended_metadata(self, list_extracted): + """ + Store the content of files with wk:extendedMetadata set to True in extended_metadata, + and remove files with wk:extendedMetadata set to True from hasPart. + + Args: + list_extracted (list): List of extracted metadata dictionaries. + Returns: + list: The updated list of extracted metadata with extended metadata merged. + """ + for extracted in list_extracted: + extracted.pop('extended_metadata', None) + if 'hasPart' not in extracted: + continue + file_indices = [ + idx for idx, item in enumerate(extracted['hasPart']) + if item.get('wk:extendedMetadata') is True + ] + if not file_indices: + continue + extended_metadatas = {} + extracted['extended_metadata'] = {} + for idx in reversed(file_indices): + filename = extracted['hasPart'].pop(idx).get('@id') + content = self.extract_text_from_files(filename) + extended_metadatas[filename] = content + extracted['extended_metadata']['value'] = json.dumps( + extended_metadatas, ensure_ascii=False) + return list_extracted + + def extract_text_from_files(self, filename): + """ + Extract text content from the specified file, + only if the file is of a specific MIME type. + Args: + filename (str): The name of the file to extract text from. 
+ + Returns: + str: The extracted text content from the file. + """ + data_path = self.data_path + try: + file_path = os.path.join(data_path, filename) + if not os.path.isfile(file_path): + raise FileNotFoundError + data = "" + mimetype = mimetypes.guess_type(filename)[0] + file_size_limit = current_app.config['WEKO_DEPOSIT_FILESIZE_LIMIT'] + # List of text-based MIME types allowed for text extraction and processing. + text_mimetypes = current_app.config["WEKO_DEPOSIT_TEXTMIMETYPE_WHITELIST_FOR_ES"] + # All mimetypes subject to text extraction (including text_mimetypes) + extract_mimetypes = current_app.config["WEKO_MIMETYPE_WHITELIST_FOR_ES"] + if mimetype not in extract_mimetypes: + return data + + # Extract content from file + current_app.logger.debug(f"extracting content from {filename}") + if mimetype in text_mimetypes: + with open(file_path, "rb") as fp: + data = fp.read(file_size_limit) + inf = chardet.detect(data) + if inf["encoding"] is None: + raise ValueError( + f"Failed to load text file: {filename}") + data = data.decode(inf["encoding"], errors="replace") + elif mimetype == 'application/pdf': + data = extract_text_from_pdf(file_path, file_size_limit) + else: + try: + data = extract_text_with_tika(file_path, file_size_limit) + except Exception as e: + current_app.logger.error(e) + traceback.print_exc() + raise ValueError( + f"Failed to load document: {filename}") from e + except FileNotFoundError as e: + current_app.logger.error(e) + traceback.print_exc() + raise FileNotFoundError(f"File Not Found: {filename}") from e + except PdfiumError as e: + current_app.logger.error(e) + traceback.print_exc() + raise PdfiumError(f"Failed to load PDF file: {filename}") from e + return data + def to_rocrate_metadata( self, record_metadata=None, tsv_row_metadata=None, **kwargs ): @@ -2272,7 +2373,7 @@ def dereference(keys, initial_entity=None): return value # files entity reconstruction - # "@id" in files entity is format like "data/sample.txt" + # "@id" in files 
entity is format like "sample.txt" filename_mapping = "" file_url_url_mapping = "" for k, m in properties_mapping.items(): @@ -2289,24 +2390,21 @@ def dereference(keys, initial_entity=None): if file_key == "hasPart" and files_entity: del rocrate.root_dataset["hasPart"] - extracted_files = kwargs.get("extracted_files", []) + extracted_files = kwargs.get("extracted_files", []) # type: list[str] for entity in files_entity: - file_metadata = entity._jsonld + file_metadata = entity._jsonld # type: dict del file_metadata["@id"] del file_metadata["@type"] - filename = dereference(filename_mapping.split(".")[1:], entity) + filename = dereference(filename_mapping.split(".")[1:], entity) # type: str url = dereference(file_url_url_mapping.split(".")[1:], entity) entity.delete() - host_url = current_app.config["THEME_SITEURL"] + host_url = current_app.config["THEME_SITEURL"] # type: str if isinstance(url, str) and host_url not in url: rocrate.add_file(url, properties=file_metadata) else: file_metadata["wk:textExtraction"] = filename in extracted_files - rocrate.add_file( - dest_path=f"data/{filename}", - properties=file_metadata - ) + rocrate.add_file( dest_path=filename, properties=file_metadata) # Extra if "Extra" in item_map: @@ -2351,3 +2449,126 @@ def dereference(keys, initial_entity=None): rocrate.root_dataset["wk:metadataAutoFill"] = False return rocrate + + +def set_by_jsonpath(root, path, value, fixed_properties=None): + """ + Set a value inside a nested dict/list structure using a JSONPath-like syntax. + + Args: + root (dict | list): The root object to modify. + path (str): The JSONPath-like path to the location to set the value. + value: The value to set at the specified location. + fixed_properties (dict | None): + Fixed value info in the form {parent_path: {sub_key: value}}. + If the path matches when creating a dict, merge these values. 
+ """ + tokens = [] + i = 0 + while i < len(path): + if path[i] == '.': + i += 1 + continue + if path[i] == '[': + j = path.find(']', i) + if j == -1: + raise ValueError("Unmatched '[' in path") + index_str = path[i+1:j] + if not index_str.isdigit(): + raise ValueError("Only integer indices are allowed inside []") + tokens.append(int(index_str)) + i = j + 1 + else: + j = i + while j < len(path) and path[j] not in '.[': + j += 1 + tokens.append(path[i:j]) + i = j + + if not tokens: + raise ValueError("Empty path") + + # Traverse until the second last token + cur = root + for idx in range(len(tokens) - 1): + tok = tokens[idx] + next_tok = tokens[idx + 1] + + if isinstance(tok, int): + # Current should be a list + if not isinstance(cur, list): + raise TypeError("Expected list when accessing by index") + # Extend list if necessary + while len(cur) <= tok: + if isinstance(next_tok, int): + cur.append([]) + else: + # Merge fixed properties if available + parent_path = ".".join( + [t for t in tokens[:idx+1] if not isinstance(t, int)] + ) + if fixed_properties and parent_path in fixed_properties: + d = dict(fixed_properties[parent_path]) + cur.append(d) + else: + cur.append({}) + cur = cur[tok] + else: + # Current should be a dict + if not isinstance(cur, dict): + raise TypeError("Expected dict when accessing by key") + if tok not in cur: + if isinstance(next_tok, int): + cur[tok] = [] + else: + # Merge fixed properties if available + parent_path = ".".join( + [t for t in tokens[:idx+1] if not isinstance(t, int)] + ) + if fixed_properties and parent_path in fixed_properties: + d = dict(fixed_properties[parent_path]) + cur[tok] = d + else: + cur[tok] = {} + cur = cur[tok] + + # Set the final value + last = tokens[-1] + if isinstance(last, int): + if not isinstance(cur, list): + raise TypeError("Expected list for final index") + while len(cur) <= last: + cur.append(None) + cur[last] = value + else: + if not isinstance(cur, dict): + raise TypeError("Expected dict for final 
key") + cur[last] = value + + +def tokenize_jsonpath(json_path): + """Tokenize the json path. + + Separate keys and indices from json path. + + Args: + json_path (str): json path. + + Returns: + list[tuple[str,int|None],str]: list of tokens (element, index). + """ + matches = re.findall(r"([^.\[]+)(?:\[(\d+)\])?\.?", json_path) + tokens = [] # type: list[tuple[str, int|None, str]] + current_path = "" + for element, index_str in matches: + if current_path: + current_path += "." + element + else: + current_path = element + + if index_str: + index = int(index_str) + else: + index = None + tokens.append((element, index, current_path)) + return tokens diff --git a/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.mo b/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.mo index 343b548c26..727dc9c791 100644 Binary files a/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.mo and b/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.mo differ diff --git a/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.po b/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.po index 821582acfd..92aab53922 100644 --- a/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.po +++ b/modules/weko-search-ui/weko_search_ui/translations/en/LC_MESSAGES/messages.po @@ -8,102 +8,167 @@ msgid "" msgstr "" "Project-Id-Version: weko-search-ui 0.1.0.dev20170000\n" "Report-Msgid-Bugs-To: wekosoftware@nii.ac.jp\n" -"POT-Creation-Date: 2025-05-27 19:16+0900\n" +"POT-Creation-Date: 2025-11-12 12:12+0900\n" "PO-Revision-Date: 2025-04-09 23:22+0900\n" "Last-Translator: FULL NAME \n" "Language: en\n" "Language-Team: en \n" -"Plural-Forms: nplurals=2; plural=(n != 1)\n" +"Plural-Forms: nplurals=2; plural=(n != 1);\n" "MIME-Version: 1.0\n" "Content-Type: text/plain; charset=utf-8\n" "Content-Transfer-Encoding: 8bit\n" -"Generated-By: Babel 
2.5.1\n" +"Generated-By: Babel 2.17.0\n" -#: tests/conftest.py:399 +#: tests/conftest.py:409 msgid "write your own license" msgstr "" -#: tests/conftest.py:404 +#: tests/conftest.py:415 msgid "Creative Commons CC0 1.0 Universal Public Domain Designation" msgstr "" -#: tests/conftest.py:420 +#: tests/conftest.py:430 msgid "Creative Commons Attribution 3.0 Unported (CC BY 3.0)" msgstr "" -#: tests/conftest.py:432 +#: tests/conftest.py:443 msgid "Creative Commons Attribution-ShareAlike 3.0 Unported (CC BY-SA 3.0)" msgstr "" -#: tests/conftest.py:447 +#: tests/conftest.py:458 msgid "Creative Commons Attribution-NoDerivs 3.0 Unported (CC BY-ND 3.0)" msgstr "" -#: tests/conftest.py:461 +#: tests/conftest.py:472 msgid "Creative Commons Attribution-NonCommercial 3.0 Unported (CC BY-NC 3.0)" msgstr "" -#: tests/conftest.py:476 +#: tests/conftest.py:487 msgid "" "Creative Commons Attribution-NonCommercial-ShareAlike 3.0 Unported (CC " "BY-NC-SA 3.0)" msgstr "" -#: tests/conftest.py:491 +#: tests/conftest.py:502 msgid "" "Creative Commons Attribution-NonCommercial-NoDerivs 3.0 Unported (CC BY-" "NC-ND 3.0)" msgstr "" -#: tests/conftest.py:507 +#: tests/conftest.py:517 msgid "Creative Commons Attribution 4.0 International (CC BY 4.0)" msgstr "" -#: tests/conftest.py:519 +#: tests/conftest.py:530 msgid "Creative Commons Attribution-ShareAlike 4.0 International (CC BY-SA 4.0)" msgstr "" -#: tests/conftest.py:534 +#: tests/conftest.py:545 msgid "" "Creative Commons Attribution-NoDerivatives 4.0 International (CC BY-ND " "4.0)" msgstr "" -#: tests/conftest.py:549 +#: tests/conftest.py:560 msgid "" "Creative Commons Attribution-NonCommercial 4.0 International (CC BY-NC " "4.0)" msgstr "" -#: tests/conftest.py:564 +#: tests/conftest.py:575 msgid "" "Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International " "(CC BY-NC-SA 4.0)" msgstr "" -#: tests/conftest.py:579 +#: tests/conftest.py:590 msgid "" "Creative Commons Attribution-NonCommercial-NoDerivatives 4.0 " 
"International (CC BY-NC-ND 4.0)" msgstr "" -#: weko_search_ui/admin.py:158 +#: tests/helpers.py:84 +msgid "Bagging a parent of the current directory is not supported" +msgstr "" + +#: tests/helpers.py:87 +#, python-format +msgid "Creating tag for directory %s" +msgstr "" + +#: tests/helpers.py:90 tests/helpers.py:91 +#, python-format +msgid "Bag directory %s does not exist" +msgstr "" + +#: tests/helpers.py:96 tests/helpers.py:97 +#, python-format +msgid "Bag directory %s does not contain a data directory" +msgstr "" + +#: tests/helpers.py:104 +#, python-format +msgid "" +"Unable to write to the following directories and files:\n" +"%s" +msgstr "" + +#: tests/helpers.py:107 +msgid "Missing permissions to move all files and directories" +msgstr "" + +#: tests/helpers.py:114 +#, python-format +msgid "" +"The following directories do not have read permissions:\n" +"%s" +msgstr "" + +#: tests/helpers.py:119 +#, python-format +msgid "" +"The following files do not have read permissions:\n" +"%s" +msgstr "" + +#: tests/helpers.py:123 +msgid "Read permissions are required to calculate file fixities" +msgstr "" + +#: tests/helpers.py:126 +msgid "Creating data directory" +msgstr "" + +#: tests/helpers.py:143 +msgid "Creating bagit.txt" +msgstr "" + +#: tests/helpers.py:148 +msgid "Creating bag-info.txt" +msgstr "" + +#: tests/helpers.py:167 +#, python-format +msgid "An error occurred creating a bag in %s" +msgstr "" + +#: weko_search_ui/admin.py:157 msgid "The following item(s) cannot be deleted." msgstr "" -#: weko_search_ui/admin.py:163 +#: weko_search_ui/admin.py:162 msgid "DOI granting item(s):" msgstr "" -#: weko_search_ui/admin.py:168 +#: weko_search_ui/admin.py:167 msgid "Editing item(s):" msgstr "" -#: weko_search_ui/admin.py:171 +#: weko_search_ui/admin.py:170 msgid "Success" msgstr "" -#: weko_search_ui/admin.py:204 +#: weko_search_ui/admin.py:203 msgid "Index Delete is in progress on another device." 
msgstr "" @@ -114,27 +179,27 @@ msgid "" "you want to continue deleting items that are not grant DOI?" msgstr "" -#: weko_search_ui/admin.py:216 +#: weko_search_ui/admin.py:215 msgid "Are you sure you want to delete it?" msgstr "Are you sure you want to discard the input contents?" -#: weko_search_ui/admin.py:219 +#: weko_search_ui/admin.py:218 msgid "No such index." msgstr "" -#: weko_search_ui/admin.py:310 weko_search_ui/admin.py:1243 +#: weko_search_ui/admin.py:309 weko_search_ui/admin.py:1250 msgid "Custom Sort" msgstr "" -#: weko_search_ui/admin.py:312 weko_search_ui/admin.py:1234 +#: weko_search_ui/admin.py:311 weko_search_ui/admin.py:1241 msgid "Bulk Delete" msgstr "" -#: weko_search_ui/admin.py:325 +#: weko_search_ui/admin.py:324 msgid "Bulk Update" msgstr "" -#: weko_search_ui/admin.py:440 weko_search_ui/admin.py:868 +#: weko_search_ui/admin.py:439 weko_search_ui/admin.py:872 #: weko_search_ui/templates/weko_search_ui/admin/export.html:53 #: weko_search_ui/templates/weko_search_ui/admin/import.html:96 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:97 @@ -142,29 +207,29 @@ msgstr "" msgid "Internal server error" msgstr "" -#: weko_search_ui/admin.py:1225 weko_search_ui/admin.py:1242 +#: weko_search_ui/admin.py:1232 weko_search_ui/admin.py:1249 #: weko_search_ui/templates/weko_search_ui/admin/import.html:53 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:54 msgid "Index Tree" msgstr "" -#: weko_search_ui/admin.py:1233 weko_search_ui/admin.py:1251 -#: weko_search_ui/admin.py:1260 weko_search_ui/admin.py:1270 +#: weko_search_ui/admin.py:1240 weko_search_ui/admin.py:1258 +#: weko_search_ui/admin.py:1267 weko_search_ui/admin.py:1277 msgid "Items" msgstr "" -#: weko_search_ui/admin.py:1252 +#: weko_search_ui/admin.py:1259 #: weko_search_ui/templates/weko_search_ui/admin/import.html:42 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:43 msgid "Import" msgstr "" -#: weko_search_ui/admin.py:1261 +#: 
weko_search_ui/admin.py:1268 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:42 msgid "RO-Crate Import" msgstr "" -#: weko_search_ui/admin.py:1271 +#: weko_search_ui/admin.py:1278 msgid "Bulk Export" msgstr "" @@ -172,23 +237,53 @@ msgstr "" msgid "contents" msgstr "" -#: weko_search_ui/mapper.py:1360 +#: weko_search_ui/mapper.py:1375 +#, python-brace-format msgid "\"{key}\" is required." msgstr "" -#: weko_search_ui/mapper.py:1381 +#: weko_search_ui/mapper.py:1396 +#, python-brace-format msgid "\"{key}\" is not in itemtype." msgstr "" -#: weko_search_ui/mapper.py:1383 +#: weko_search_ui/mapper.py:1398 +#, python-brace-format msgid "\"{key}\" is not in itemtype, did you mean \"{similar_key}\"?" msgstr "" -#: weko_search_ui/tasks.py:328 +#: weko_search_ui/mapper.py:1517 +#, python-format +msgid "" +"Cannot map to item type from json-ld; Mapping is not defined for the " +"metadata, \"%(key)s\": \"%(value)s\"" +msgstr "" + +#: weko_search_ui/mapper.py:1543 +#, python-format +msgid "" +"Cannot map to item type from json-ld; Not found mapping destination for " +"the metadata, \"%(key)s\": \"%(value)s\"" +msgstr "" + +#: weko_search_ui/mapper.py:1553 +#, python-format +msgid "Failed to set metadata for json-ld, \"%(key)s\": \"%(value)s\"" +msgstr "" + +#: weko_search_ui/mapper.py:1572 +msgid "Metadata which could not be mapped to item type will be set in 'Extra'." +msgstr "" + +#: weko_search_ui/mapper.py:1576 +msgid "Metadata which could not be mapped to item type will be discarded." +msgstr "" + +#: weko_search_ui/tasks.py:337 msgid "`wk:metadata_replace` flag cannot be used in RO-Crate Import." msgstr "" -#: weko_search_ui/tasks.py:343 +#: weko_search_ui/tasks.py:352 msgid "`wk:isSplited` flag cannot be used in RO-Crate Import." msgstr "" @@ -196,25 +291,28 @@ msgstr "" msgid "The same item may have been registered." 
msgstr "" -#: weko_search_ui/utils.py:592 weko_search_ui/utils.py:708 +#: weko_search_ui/utils.py:593 weko_search_ui/utils.py:709 +#, python-brace-format msgid "" "The format of the specified file {} does not support import. Please " "specify one of the following formats: zip, tar, gztar, bztar, xztar." msgstr "" -#: weko_search_ui/utils.py:600 +#: weko_search_ui/utils.py:601 +#, python-brace-format msgid "" "The csv/tsv file was not found in the specified file {}. Check if the " "directory structure is correct." msgstr "" -#: weko_search_ui/utils.py:649 +#: weko_search_ui/utils.py:650 msgid "" "The item type of the item to be imported is missing or has already been " "deleted." msgstr "" -#: weko_search_ui/utils.py:715 +#: weko_search_ui/utils.py:716 +#, python-brace-format msgid "" "The xml file was not found in the specified file {}. Check if the " "directory structure is correct." @@ -224,268 +322,305 @@ msgstr "" msgid "The item type ID specified in the XML file does not exist." msgstr "" -#: weko_search_ui/utils.py:1215 +#: weko_search_ui/utils.py:1206 +#, python-brace-format msgid "" "There is an error in the format of the first line of the header of the {}" " file." msgstr "" -#: weko_search_ui/utils.py:1234 +#: weko_search_ui/utils.py:1225 +#, python-brace-format msgid "The item type ID specified in the {} file does not exist." msgstr "" -#: weko_search_ui/utils.py:1243 +#: weko_search_ui/utils.py:1236 msgid "Cannot register because the specified item type is not the latest version." msgstr "" -#: weko_search_ui/utils.py:1258 +#: weko_search_ui/utils.py:1250 +#, python-brace-format msgid "The following metadata keys are duplicated.
{}" msgstr "" -#: weko_search_ui/utils.py:1281 +#: weko_search_ui/utils.py:1274 +#, python-brace-format msgid "The item does not consistent with the specified item type.
{}" msgstr "" -#: weko_search_ui/utils.py:1311 +#: weko_search_ui/utils.py:1303 +#, python-brace-format msgid "Cannot read {} file correctly." msgstr "" -#: weko_search_ui/utils.py:1331 +#: weko_search_ui/utils.py:1328 +#, python-brace-format msgid "" "The following items are not registered because they do not exist in the " "specified item type. {}" msgstr "" -#: weko_search_ui/utils.py:1341 +#: weko_search_ui/utils.py:1336 +#, python-brace-format msgid "" "The {} file could not be read. Make sure the file format is {} and that " "the file is UTF-8 encoded." msgstr "" -#: weko_search_ui/utils.py:1372 +#: weko_search_ui/utils.py:1369 msgid "" "The XML file could not be read. Make sure the file format is XML and that" " the file is UTF-8 encoded." msgstr "" -#: weko_search_ui/utils.py:1444 +#: weko_search_ui/utils.py:1441 msgid "Please specify item ID by half-width number." msgstr "" -#: weko_search_ui/utils.py:1459 +#: weko_search_ui/utils.py:1462 +#, python-format +msgid "Replace value of %(target_path)s from %(old_value)s to '%(new_value)s'." +msgstr "" + +#: weko_search_ui/utils.py:1475 msgid "Specified item type does not exist." msgstr "" -#: weko_search_ui/utils.py:1533 +#: weko_search_ui/utils.py:1481 +#, python-format +msgid "Specified %(type)s is different from existing %(existing_type)s." +msgstr "" + +#: weko_search_ui/utils.py:1556 msgid "Specified URI and system URI do not match." msgstr "" -#: weko_search_ui/utils.py:1545 +#: weko_search_ui/utils.py:1568 msgid "Item does not exist in the system." msgstr "" -#: weko_search_ui/utils.py:1552 +#: weko_search_ui/utils.py:1575 msgid "Item already DELETED in the system." msgstr "" -#: weko_search_ui/utils.py:1569 +#: weko_search_ui/utils.py:1592 msgid "Please specify either \"Keep\" or \"Upgrade\"." msgstr "" -#: weko_search_ui/utils.py:2472 +#: weko_search_ui/utils.py:2508 msgid "Title is required item." 
msgstr "" -#: weko_search_ui/utils.py:2489 +#: weko_search_ui/utils.py:2525 +#, python-brace-format msgid "{} is required item." msgstr "" -#: weko_search_ui/utils.py:2492 +#: weko_search_ui/utils.py:2528 +#, python-brace-format msgid "Please set \"public\" or \"private\" for {}." msgstr "" -#: weko_search_ui/utils.py:2533 +#: weko_search_ui/utils.py:2569 +#, python-brace-format msgid "The specified {} does not exist in system." msgstr "" -#: weko_search_ui/utils.py:2543 +#: weko_search_ui/utils.py:2579 +#, python-brace-format msgid "Specified {} does not match with existing index." msgstr "" -#: weko_search_ui/utils.py:2587 +#: weko_search_ui/utils.py:2623 msgid "Your role cannot register items in this index." msgstr "" -#: weko_search_ui/utils.py:2608 +#: weko_search_ui/utils.py:2644 msgid "Both of IndexID and POS_INDEX are not being set." msgstr "" -#: weko_search_ui/utils.py:2654 weko_search_ui/utils.py:2679 +#: weko_search_ui/utils.py:2690 weko_search_ui/utils.py:2715 +#, python-brace-format msgid "Specified {} is invalid." msgstr "" -#: weko_search_ui/utils.py:2721 weko_search_ui/utils.py:2754 -#: weko_search_ui/utils.py:2846 weko_search_ui/utils.py:2916 -#: weko_search_ui/utils.py:2920 weko_search_ui/utils.py:2942 -#: weko_search_ui/utils.py:2966 +#: weko_search_ui/utils.py:2757 weko_search_ui/utils.py:2790 +#: weko_search_ui/utils.py:2882 weko_search_ui/utils.py:2952 +#: weko_search_ui/utils.py:2956 weko_search_ui/utils.py:2978 +#: weko_search_ui/utils.py:3002 +#, python-brace-format msgid "Please specify {}." msgstr "" -#: weko_search_ui/utils.py:2724 weko_search_ui/utils.py:2923 +#: weko_search_ui/utils.py:2760 weko_search_ui/utils.py:2960 +#, python-brace-format msgid "The specified {} exceeds the maximum length." 
msgstr "" -#: weko_search_ui/utils.py:2739 weko_search_ui/utils.py:2897 -#: weko_search_ui/utils.py:2907 weko_search_ui/utils.py:2938 +#: weko_search_ui/utils.py:2775 weko_search_ui/utils.py:2933 +#: weko_search_ui/utils.py:2943 weko_search_ui/utils.py:2974 +#, python-brace-format msgid "Specified Prefix of {} is incorrect." msgstr "" -#: weko_search_ui/utils.py:2747 weko_search_ui/utils.py:2891 -#: weko_search_ui/utils.py:2900 +#: weko_search_ui/utils.py:2783 weko_search_ui/utils.py:2927 +#: weko_search_ui/utils.py:2936 +#, python-brace-format msgid "{} cannot be set." msgstr "" -#: weko_search_ui/utils.py:2756 weko_search_ui/utils.py:2760 -#: weko_search_ui/utils.py:2829 weko_search_ui/utils.py:2968 +#: weko_search_ui/utils.py:2793 weko_search_ui/utils.py:2797 +#: weko_search_ui/utils.py:2865 weko_search_ui/utils.py:3005 +#, python-brace-format msgid "Specified {} is different from existing {}." msgstr "" -#: weko_search_ui/utils.py:2780 +#: weko_search_ui/utils.py:2817 msgid "" "When assigning a DOI to an item, it must be associated with an index " "whose index status is \"Public\" and Harvest Publishing is \"Public\"." msgstr "" -#: weko_search_ui/utils.py:2785 +#: weko_search_ui/utils.py:2822 msgid "" "Since the item has a DOI, it must be associated with an index whose index" " status is \"Public\" and whose Harvest Publishing is \"Public\"." msgstr "" -#: weko_search_ui/utils.py:2796 +#: weko_search_ui/utils.py:2832 msgid "You cannot keep an item private because it has a DOI." msgstr "" -#: weko_search_ui/utils.py:2850 weko_search_ui/utils.py:4070 +#: weko_search_ui/utils.py:2887 weko_search_ui/utils.py:4106 msgid "DOI_RA should be set by one of JaLC, Crossref, DataCite, NDL JaLC." msgstr "" -#: weko_search_ui/utils.py:3001 +#: weko_search_ui/utils.py:3037 +#, python-brace-format msgid "Item Link type: '{}' is not one of {}." msgstr "" -#: weko_search_ui/utils.py:3005 +#: weko_search_ui/utils.py:3041 msgid "Please specify Item URL for item link." 
msgstr "" -#: weko_search_ui/utils.py:3019 +#: weko_search_ui/utils.py:3055 msgid "Specified Item Link URI and system URI do not match." msgstr "" -#: weko_search_ui/utils.py:3025 +#: weko_search_ui/utils.py:3061 msgid "Linking item does not exist in the system." msgstr "" -#: weko_search_ui/utils.py:3028 +#: weko_search_ui/utils.py:3064 msgid "Linking item already deleted in the system." msgstr "" -#: weko_search_ui/utils.py:3067 +#: weko_search_ui/utils.py:3103 msgid "It is not allowed to create links to the item itself." msgstr "" -#: weko_search_ui/utils.py:3072 +#: weko_search_ui/utils.py:3108 +#, python-brace-format msgid "It is not allowed to create links other than {} between split items." msgstr "" -#: weko_search_ui/utils.py:3108 +#: weko_search_ui/utils.py:3144 msgid "Duplicate Item Link." msgstr "" -#: weko_search_ui/utils.py:3447 +#: weko_search_ui/utils.py:3483 +#, python-brace-format msgid "" "One of the following required values ​​has not been " "registered.
{}
" msgstr "" -#: weko_search_ui/utils.py:3452 +#: weko_search_ui/utils.py:3489 +#, python-brace-format msgid "" "The mapping of required items for DOI validation is not set. Please " "recheck the following mapping settings.
{}" msgstr "" -#: weko_search_ui/utils.py:3462 +#: weko_search_ui/utils.py:3498 +#, python-brace-format msgid "The following metadata are required.
{}" msgstr "" -#: weko_search_ui/utils.py:3467 +#: weko_search_ui/utils.py:3504 +#, python-brace-format msgid "One of the following metadata is required.
{}
" msgstr "" -#: weko_search_ui/utils.py:3530 weko_search_ui/utils.py:3542 +#: weko_search_ui/utils.py:3567 weko_search_ui/utils.py:3579 msgid "Please specify the date with any format of YYYY-MM-DD, YYYY-MM, YYYY." msgstr "" -#: weko_search_ui/utils.py:3536 +#: weko_search_ui/utils.py:3572 +#, python-brace-format msgid "Replace value of {} from {} to {}." msgstr "" -#: weko_search_ui/utils.py:3559 +#: weko_search_ui/utils.py:3595 msgid "Please specify PubDate with YYYY-MM-DD." msgstr "" -#: weko_search_ui/utils.py:3589 +#: weko_search_ui/utils.py:3625 msgid "ID is specified for the newly registered item. Ignore the ID and register." msgstr "" -#: weko_search_ui/utils.py:3672 +#: weko_search_ui/utils.py:3708 msgid "Please specify Open Access Date with YYYY-MM-DD." msgstr "" -#: weko_search_ui/utils.py:3909 weko_search_ui/utils.py:4055 -#: weko_search_ui/utils.py:4061 +#: weko_search_ui/utils.py:3945 weko_search_ui/utils.py:4091 +#: weko_search_ui/utils.py:4097 msgid "Please specify DOI prefix/suffix." msgstr "" -#: weko_search_ui/utils.py:4047 +#: weko_search_ui/utils.py:4083 msgid "The specified DOI is wrong and fixed with the registered DOI." msgstr "" -#: weko_search_ui/utils.py:4050 +#: weko_search_ui/utils.py:4086 msgid "" "The specified DOI RA is wrong and fixed with the correct DOI RA of the " "registered DOI." msgstr "" -#: weko_search_ui/utils.py:4057 weko_search_ui/utils.py:4063 +#: weko_search_ui/utils.py:4093 weko_search_ui/utils.py:4099 msgid "Please specify DOI suffix." msgstr "" -#: weko_search_ui/utils.py:4066 +#: weko_search_ui/utils.py:4102 msgid "Do not specify DOI suffix." msgstr "" -#: weko_search_ui/utils.py:4072 +#: weko_search_ui/utils.py:4108 msgid "Specified Prefix of DOI is incorrect." msgstr "" -#: weko_search_ui/utils.py:4104 +#: weko_search_ui/utils.py:4141 msgid "" "Please specify the image file(gif, jpg, jpe, jpeg, png, bmp, tiff, tif) " "for the thumbnail." 
msgstr "" -#: weko_search_ui/utils.py:5220 +#: weko_search_ui/utils.py:5256 +#, python-brace-format msgid "The file specified in ({}) does not exist." msgstr "" -#: weko_search_ui/utils.py:5224 +#: weko_search_ui/utils.py:5261 +#, python-brace-format msgid "" "The file specified in ({}) does not exist.
The file will not be " "updated. Update only the metadata with csv/tsv contents." msgstr "" -#: weko_search_ui/utils.py:5511 +#: weko_search_ui/utils.py:5547 +#, python-brace-format msgid "The file name specified in {} and {} do not match." msgstr "" diff --git a/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.mo b/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.mo index 2b124cce9d..fbc36b019c 100644 Binary files a/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.mo and b/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.mo differ diff --git a/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.po b/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.po index 8a47f9a05d..c7dce7d302 100644 --- a/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.po +++ b/modules/weko-search-ui/weko_search_ui/translations/ja/LC_MESSAGES/messages.po @@ -8,102 +8,167 @@ msgid "" msgstr "" "Project-Id-Version: weko-search-ui 0.1.0.dev20170000\n" "Report-Msgid-Bugs-To: wekosoftware@nii.ac.jp\n" -"POT-Creation-Date: 2025-05-27 19:16+0900\n" +"POT-Creation-Date: 2025-11-12 12:12+0900\n" "PO-Revision-Date: 2025-04-09 22:35+0900\n" "Last-Translator: FULL NAME \n" "Language: ja\n" "Language-Team: ja \n" -"Plural-Forms: nplurals=1; plural=0\n" +"Plural-Forms: nplurals=1; plural=0;\n" "MIME-Version: 1.0\n" "Content-Type: text/plain; charset=utf-8\n" "Content-Transfer-Encoding: 8bit\n" -"Generated-By: Babel 2.5.1\n" +"Generated-By: Babel 2.17.0\n" -#: tests/conftest.py:399 +#: tests/conftest.py:409 msgid "write your own license" msgstr "" -#: tests/conftest.py:404 +#: tests/conftest.py:415 msgid "Creative Commons CC0 1.0 Universal Public Domain Designation" msgstr "" -#: tests/conftest.py:420 +#: tests/conftest.py:430 msgid "Creative Commons Attribution 3.0 Unported (CC BY 3.0)" msgstr "" -#: tests/conftest.py:432 +#: 
tests/conftest.py:443 msgid "Creative Commons Attribution-ShareAlike 3.0 Unported (CC BY-SA 3.0)" msgstr "" -#: tests/conftest.py:447 +#: tests/conftest.py:458 msgid "Creative Commons Attribution-NoDerivs 3.0 Unported (CC BY-ND 3.0)" msgstr "" -#: tests/conftest.py:461 +#: tests/conftest.py:472 msgid "Creative Commons Attribution-NonCommercial 3.0 Unported (CC BY-NC 3.0)" msgstr "" -#: tests/conftest.py:476 +#: tests/conftest.py:487 msgid "" "Creative Commons Attribution-NonCommercial-ShareAlike 3.0 Unported (CC " "BY-NC-SA 3.0)" msgstr "" -#: tests/conftest.py:491 +#: tests/conftest.py:502 msgid "" "Creative Commons Attribution-NonCommercial-NoDerivs 3.0 Unported (CC BY-" "NC-ND 3.0)" msgstr "" -#: tests/conftest.py:507 +#: tests/conftest.py:517 msgid "Creative Commons Attribution 4.0 International (CC BY 4.0)" msgstr "" -#: tests/conftest.py:519 +#: tests/conftest.py:530 msgid "Creative Commons Attribution-ShareAlike 4.0 International (CC BY-SA 4.0)" msgstr "" -#: tests/conftest.py:534 +#: tests/conftest.py:545 msgid "" "Creative Commons Attribution-NoDerivatives 4.0 International (CC BY-ND " "4.0)" msgstr "" -#: tests/conftest.py:549 +#: tests/conftest.py:560 msgid "" "Creative Commons Attribution-NonCommercial 4.0 International (CC BY-NC " "4.0)" msgstr "" -#: tests/conftest.py:564 +#: tests/conftest.py:575 msgid "" "Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International " "(CC BY-NC-SA 4.0)" msgstr "" -#: tests/conftest.py:579 +#: tests/conftest.py:590 msgid "" "Creative Commons Attribution-NonCommercial-NoDerivatives 4.0 " "International (CC BY-NC-ND 4.0)" msgstr "" -#: weko_search_ui/admin.py:158 +#: tests/helpers.py:84 +msgid "Bagging a parent of the current directory is not supported" +msgstr "" + +#: tests/helpers.py:87 +#, python-format +msgid "Creating tag for directory %s" +msgstr "" + +#: tests/helpers.py:90 tests/helpers.py:91 +#, python-format +msgid "Bag directory %s does not exist" +msgstr "" + +#: tests/helpers.py:96 
tests/helpers.py:97 +#, python-format +msgid "Bag directory %s does not contain a data directory" +msgstr "" + +#: tests/helpers.py:104 +#, python-format +msgid "" +"Unable to write to the following directories and files:\n" +"%s" +msgstr "" + +#: tests/helpers.py:107 +msgid "Missing permissions to move all files and directories" +msgstr "" + +#: tests/helpers.py:114 +#, python-format +msgid "" +"The following directories do not have read permissions:\n" +"%s" +msgstr "" + +#: tests/helpers.py:119 +#, python-format +msgid "" +"The following files do not have read permissions:\n" +"%s" +msgstr "" + +#: tests/helpers.py:123 +msgid "Read permissions are required to calculate file fixities" +msgstr "" + +#: tests/helpers.py:126 +msgid "Creating data directory" +msgstr "" + +#: tests/helpers.py:143 +msgid "Creating bagit.txt" +msgstr "" + +#: tests/helpers.py:148 +msgid "Creating bag-info.txt" +msgstr "" + +#: tests/helpers.py:167 +#, python-format +msgid "An error occurred creating a bag in %s" +msgstr "" + +#: weko_search_ui/admin.py:157 msgid "The following item(s) cannot be deleted." msgstr "以下のアイテムを削除することはできませんでした。" -#: weko_search_ui/admin.py:163 +#: weko_search_ui/admin.py:162 msgid "DOI granting item(s):" msgstr "DOI付与済みのアイテム:" -#: weko_search_ui/admin.py:168 +#: weko_search_ui/admin.py:167 msgid "Editing item(s):" msgstr "編集中のアイテム:" -#: weko_search_ui/admin.py:171 +#: weko_search_ui/admin.py:170 msgid "Success" msgstr "" -#: weko_search_ui/admin.py:204 +#: weko_search_ui/admin.py:203 msgid "Index Delete is in progress on another device." msgstr "" @@ -114,27 +179,27 @@ msgid "" "you want to continue deleting items that are not grant DOI?" msgstr "削除対象にDOI付与済みアイテムが含まれています。
DOI付与済みアイテムはDOI取下げを行わないと削除できません。
DOI付与済み以外のアイテム削除を続行しますか?" -#: weko_search_ui/admin.py:216 +#: weko_search_ui/admin.py:215 msgid "Are you sure you want to delete it?" msgstr "削除してよろしいですか?" -#: weko_search_ui/admin.py:219 +#: weko_search_ui/admin.py:218 msgid "No such index." msgstr "" -#: weko_search_ui/admin.py:310 weko_search_ui/admin.py:1243 +#: weko_search_ui/admin.py:309 weko_search_ui/admin.py:1250 msgid "Custom Sort" msgstr "カスタムソート" -#: weko_search_ui/admin.py:312 weko_search_ui/admin.py:1234 +#: weko_search_ui/admin.py:311 weko_search_ui/admin.py:1241 msgid "Bulk Delete" msgstr "一括削除" -#: weko_search_ui/admin.py:325 +#: weko_search_ui/admin.py:324 msgid "Bulk Update" msgstr "一括更新" -#: weko_search_ui/admin.py:440 weko_search_ui/admin.py:868 +#: weko_search_ui/admin.py:439 weko_search_ui/admin.py:872 #: weko_search_ui/templates/weko_search_ui/admin/export.html:53 #: weko_search_ui/templates/weko_search_ui/admin/import.html:96 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:97 @@ -142,29 +207,29 @@ msgstr "一括更新" msgid "Internal server error" msgstr "サーバ内部エラー" -#: weko_search_ui/admin.py:1225 weko_search_ui/admin.py:1242 +#: weko_search_ui/admin.py:1232 weko_search_ui/admin.py:1249 #: weko_search_ui/templates/weko_search_ui/admin/import.html:53 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:54 msgid "Index Tree" msgstr "インデックスツリー" -#: weko_search_ui/admin.py:1233 weko_search_ui/admin.py:1251 -#: weko_search_ui/admin.py:1260 weko_search_ui/admin.py:1270 +#: weko_search_ui/admin.py:1240 weko_search_ui/admin.py:1258 +#: weko_search_ui/admin.py:1267 weko_search_ui/admin.py:1277 msgid "Items" msgstr "アイテム" -#: weko_search_ui/admin.py:1252 +#: weko_search_ui/admin.py:1259 #: weko_search_ui/templates/weko_search_ui/admin/import.html:42 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:43 msgid "Import" msgstr "インポート" -#: weko_search_ui/admin.py:1261 +#: weko_search_ui/admin.py:1268 #: 
weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:42 msgid "RO-Crate Import" msgstr "RO-Crate インポート" -#: weko_search_ui/admin.py:1271 +#: weko_search_ui/admin.py:1278 msgid "Bulk Export" msgstr "一括エクスポート" @@ -172,23 +237,53 @@ msgstr "一括エクスポート" msgid "contents" msgstr "" -#: weko_search_ui/mapper.py:1360 +#: weko_search_ui/mapper.py:1375 +#, python-brace-format msgid "\"{key}\" is required." msgstr "「{key}」 に対応するマッピングが必要です。" -#: weko_search_ui/mapper.py:1381 +#: weko_search_ui/mapper.py:1396 +#, python-brace-format msgid "\"{key}\" is not in itemtype." msgstr "「{key}」 はアイテムタイプに存在しません。" -#: weko_search_ui/mapper.py:1383 +#: weko_search_ui/mapper.py:1398 +#, python-brace-format msgid "\"{key}\" is not in itemtype, did you mean \"{similar_key}\"?" msgstr "「{key}」 はアイテムタイプに存在しません。「{similar_key}」であれば存在します。" -#: weko_search_ui/tasks.py:328 +#: weko_search_ui/mapper.py:1517 +#, python-format +msgid "" +"Cannot map to item type from json-ld; Mapping is not defined for the " +"metadata, \"%(key)s\": \"%(value)s\"" +msgstr "対応するマッピングが定義されてないため、このメタデータはアイテムタイプに変換できません。\"%(key)s\": \"%(value)s\"" + +#: weko_search_ui/mapper.py:1543 +#, python-format +msgid "" +"Cannot map to item type from json-ld; Not found mapping destination for " +"the metadata, \"%(key)s\": \"%(value)s\"" +msgstr "マッピング先が見つからないため、このメタデータはアイテムタイプに変換できません。\"%(key)s\": \"%(value)s\"" + +#: weko_search_ui/mapper.py:1553 +#, python-format +msgid "Failed to set metadata for json-ld, \"%(key)s\": \"%(value)s\"" +msgstr "アイテムタイプへのマッピングに失敗しました。\"%(key)s\": \"%(value)s\"" + +#: weko_search_ui/mapper.py:1572 +msgid "Metadata which could not be mapped to item type will be set in 'Extra'." +msgstr "アイテムタイプにマッピングできなかったメタデータは、「Extra」プロパティに登録されます。" + +#: weko_search_ui/mapper.py:1576 +msgid "Metadata which could not be mapped to item type will be discarded." +msgstr "アイテムタイプにマッピングできなかったメタデータは破棄されます。" + +#: weko_search_ui/tasks.py:337 msgid "`wk:metadata_replace` flag cannot be used in RO-Crate Import." 
msgstr "RO-Crate インポートでは、`wk:metadata_replace`フラグを有効にできません。" -#: weko_search_ui/tasks.py:343 +#: weko_search_ui/tasks.py:352 msgid "`wk:isSplited` flag cannot be used in RO-Crate Import." msgstr "RO-Crate インポートでは、`wk:isSplited`フラグを有効にできません。" @@ -196,25 +291,28 @@ msgstr "RO-Crate インポートでは、`wk:isSplited`フラグを有効にで msgid "The same item may have been registered." msgstr "同じアイテムが登録されている可能性があります。" -#: weko_search_ui/utils.py:592 weko_search_ui/utils.py:708 +#: weko_search_ui/utils.py:593 weko_search_ui/utils.py:709 +#, python-brace-format msgid "" "The format of the specified file {} does not support import. Please " "specify one of the following formats: zip, tar, gztar, bztar, xztar." msgstr "指定されたファイル{}の形式はインポートに対応していません。zip,tar,gztar,bztar,xztarいずれかの形式を指定してください。" -#: weko_search_ui/utils.py:600 +#: weko_search_ui/utils.py:601 +#, python-brace-format msgid "" "The csv/tsv file was not found in the specified file {}. Check if the " "directory structure is correct." msgstr "指定されたファイル{}にtsv/csvファイルが見つかりませんでした。ディレクトリ構成が正しいか確認してください。" -#: weko_search_ui/utils.py:649 +#: weko_search_ui/utils.py:650 msgid "" "The item type of the item to be imported is missing or has already been " "deleted." msgstr "" -#: weko_search_ui/utils.py:715 +#: weko_search_ui/utils.py:716 +#, python-brace-format msgid "" "The xml file was not found in the specified file {}. Check if the " "directory structure is correct." @@ -224,268 +322,305 @@ msgstr "" msgid "The item type ID specified in the XML file does not exist." msgstr "" -#: weko_search_ui/utils.py:1215 +#: weko_search_ui/utils.py:1206 +#, python-brace-format msgid "" "There is an error in the format of the first line of the header of the {}" " file." msgstr "{}ファイルのヘッダ1行目の形式に誤りがあります。" -#: weko_search_ui/utils.py:1234 +#: weko_search_ui/utils.py:1225 +#, python-brace-format msgid "The item type ID specified in the {} file does not exist." 
msgstr "{}ファイルで指定されたアイテムタイプIDは存在しません。" -#: weko_search_ui/utils.py:1243 +#: weko_search_ui/utils.py:1236 msgid "Cannot register because the specified item type is not the latest version." msgstr "指定されたアイテムタイプが最新のバージョンでないため登録できません。" -#: weko_search_ui/utils.py:1258 +#: weko_search_ui/utils.py:1250 +#, python-brace-format msgid "The following metadata keys are duplicated.
{}" msgstr "以下のメタデータキーが重複しています。
{}" -#: weko_search_ui/utils.py:1281 +#: weko_search_ui/utils.py:1274 +#, python-brace-format msgid "The item does not consistent with the specified item type.
{}" msgstr "指定されたアイテムタイプと項目が一致しません。
{}" -#: weko_search_ui/utils.py:1311 +#: weko_search_ui/utils.py:1303 +#, python-brace-format msgid "Cannot read {} file correctly." msgstr "{}ファイルが正しく読み込めません。" -#: weko_search_ui/utils.py:1331 +#: weko_search_ui/utils.py:1328 +#, python-brace-format msgid "" "The following items are not registered because they do not exist in the " "specified item type. {}" msgstr "次の項目指定されたアイテムタイプに存在しないため登録されません。{}" -#: weko_search_ui/utils.py:1341 +#: weko_search_ui/utils.py:1336 +#, python-brace-format msgid "" "The {} file could not be read. Make sure the file format is {} and that " "the file is UTF-8 encoded." msgstr "{}ファイルを読み込めませんでした。ファイル形式が{}であること、またそのファイルがUTF-8でエンコードされているかを確認してください。" -#: weko_search_ui/utils.py:1372 +#: weko_search_ui/utils.py:1369 msgid "" "The XML file could not be read. Make sure the file format is XML and that" " the file is UTF-8 encoded." msgstr "" -#: weko_search_ui/utils.py:1444 +#: weko_search_ui/utils.py:1441 msgid "Please specify item ID by half-width number." msgstr "アイテムIDは半角数字で指定してください。" -#: weko_search_ui/utils.py:1459 +#: weko_search_ui/utils.py:1462 +#, python-format +msgid "Replace value of %(target_path)s from %(old_value)s to '%(new_value)s'." +msgstr "%(target_path)sの値を%(old_value)sから'%(new_value)s'へ置き換えました。" + +#: weko_search_ui/utils.py:1475 msgid "Specified item type does not exist." msgstr "指定されたアイテムタイプが存在していません。" -#: weko_search_ui/utils.py:1533 +#: weko_search_ui/utils.py:1481 +#, python-brace-format, python-format +msgid "Specified %(type)s is different from existing %(existing_type)s." +msgstr "指定された%(type)sは登録している%(existing_type)sと異なっています。" + +#: weko_search_ui/utils.py:1556 msgid "Specified URI and system URI do not match." msgstr "指定されたURIとシステムURIが一致しません。" -#: weko_search_ui/utils.py:1545 +#: weko_search_ui/utils.py:1568 msgid "Item does not exist in the system." msgstr "アイテムがシステムに存在しません。" -#: weko_search_ui/utils.py:1552 +#: weko_search_ui/utils.py:1575 msgid "Item already DELETED in the system." 
msgstr "リンク先アイテムは削除済です。" -#: weko_search_ui/utils.py:1569 +#: weko_search_ui/utils.py:1592 msgid "Please specify either \"Keep\" or \"Upgrade\"." msgstr "Keep、Upgradeのいずれかを指定してください。" -#: weko_search_ui/utils.py:2472 +#: weko_search_ui/utils.py:2508 msgid "Title is required item." msgstr "タイトルは必須項目です。" -#: weko_search_ui/utils.py:2489 +#: weko_search_ui/utils.py:2525 +#, python-brace-format msgid "{} is required item." msgstr "{}は必須項目です。" -#: weko_search_ui/utils.py:2492 +#: weko_search_ui/utils.py:2528 +#, python-brace-format msgid "Please set \"public\" or \"private\" for {}." msgstr "{}はpublic,privateのいずれかを設定してください。" -#: weko_search_ui/utils.py:2533 +#: weko_search_ui/utils.py:2569 +#, python-brace-format msgid "The specified {} does not exist in system." msgstr "指定された{}はシステムに存在しません。" -#: weko_search_ui/utils.py:2543 +#: weko_search_ui/utils.py:2579 +#, python-brace-format msgid "Specified {} does not match with existing index." msgstr "指定された{}はシステムのものと一致していません。" -#: weko_search_ui/utils.py:2587 +#: weko_search_ui/utils.py:2623 msgid "Your role cannot register items in this index." msgstr "ロールの権限が足りずこのインデックスにアイテム登録ができません。" -#: weko_search_ui/utils.py:2608 +#: weko_search_ui/utils.py:2644 msgid "Both of IndexID and POS_INDEX are not being set." msgstr "IndexID, POS_INDEXがどちらも設定されていません。" -#: weko_search_ui/utils.py:2654 weko_search_ui/utils.py:2679 +#: weko_search_ui/utils.py:2690 weko_search_ui/utils.py:2715 +#, python-brace-format msgid "Specified {} is invalid." 
msgstr "指定された{}は不正です。" -#: weko_search_ui/utils.py:2721 weko_search_ui/utils.py:2754 -#: weko_search_ui/utils.py:2846 weko_search_ui/utils.py:2916 -#: weko_search_ui/utils.py:2920 weko_search_ui/utils.py:2942 -#: weko_search_ui/utils.py:2966 +#: weko_search_ui/utils.py:2757 weko_search_ui/utils.py:2790 +#: weko_search_ui/utils.py:2882 weko_search_ui/utils.py:2952 +#: weko_search_ui/utils.py:2956 weko_search_ui/utils.py:2978 +#: weko_search_ui/utils.py:3002 +#, python-brace-format msgid "Please specify {}." msgstr "{}を設定してください。" -#: weko_search_ui/utils.py:2724 weko_search_ui/utils.py:2923 +#: weko_search_ui/utils.py:2760 weko_search_ui/utils.py:2960 +#, python-brace-format msgid "The specified {} exceeds the maximum length." msgstr "指定された{}が最大長を超えています。" -#: weko_search_ui/utils.py:2739 weko_search_ui/utils.py:2897 -#: weko_search_ui/utils.py:2907 weko_search_ui/utils.py:2938 +#: weko_search_ui/utils.py:2775 weko_search_ui/utils.py:2933 +#: weko_search_ui/utils.py:2943 weko_search_ui/utils.py:2974 +#, python-brace-format msgid "Specified Prefix of {} is incorrect." msgstr "指定された{}のPrefixが誤っています。" -#: weko_search_ui/utils.py:2747 weko_search_ui/utils.py:2891 -#: weko_search_ui/utils.py:2900 +#: weko_search_ui/utils.py:2783 weko_search_ui/utils.py:2927 +#: weko_search_ui/utils.py:2936 +#, python-brace-format msgid "{} cannot be set." msgstr "{}は設定できません。" -#: weko_search_ui/utils.py:2756 weko_search_ui/utils.py:2760 -#: weko_search_ui/utils.py:2829 weko_search_ui/utils.py:2968 +#: weko_search_ui/utils.py:2793 weko_search_ui/utils.py:2797 +#: weko_search_ui/utils.py:2865 weko_search_ui/utils.py:3005 +#, python-brace-format msgid "Specified {} is different from existing {}." msgstr "指定された{}は登録している{}と異なっています。" -#: weko_search_ui/utils.py:2780 +#: weko_search_ui/utils.py:2817 msgid "" "When assigning a DOI to an item, it must be associated with an index " "whose index status is \"Public\" and Harvest Publishing is \"Public\"." 
msgstr "" -#: weko_search_ui/utils.py:2785 +#: weko_search_ui/utils.py:2822 msgid "" "Since the item has a DOI, it must be associated with an index whose index" " status is \"Public\" and whose Harvest Publishing is \"Public\"." msgstr "アイテムにDOIが付与されているため、インデックス状態が「公開」かつハーベスト公開が「公開」のインデックスに関連付けが必要です。" -#: weko_search_ui/utils.py:2796 +#: weko_search_ui/utils.py:2832 msgid "You cannot keep an item private because it has a DOI." msgstr "アイテムにDOIが付与されているため、アイテムを非公開にすることはできません。" -#: weko_search_ui/utils.py:2850 weko_search_ui/utils.py:4070 +#: weko_search_ui/utils.py:2887 weko_search_ui/utils.py:4106 msgid "DOI_RA should be set by one of JaLC, Crossref, DataCite, NDL JaLC." msgstr "DOI_RAはJaLC,Crossref,DataCite,NDL JaLCのいずれかを設定してください。" -#: weko_search_ui/utils.py:3001 +#: weko_search_ui/utils.py:3037 +#, python-brace-format msgid "Item Link type: '{}' is not one of {}." msgstr "リンクタイプ'{}'は次の決められた選択肢に含まれていません。{}" -#: weko_search_ui/utils.py:3005 +#: weko_search_ui/utils.py:3041 msgid "Please specify Item URL for item link." msgstr "アイテムリンク先のURLを指定してください。" -#: weko_search_ui/utils.py:3019 +#: weko_search_ui/utils.py:3055 msgid "Specified Item Link URI and system URI do not match." msgstr "指定されたアイテムリンク先URIとシステムURIが一致しません。" -#: weko_search_ui/utils.py:3025 +#: weko_search_ui/utils.py:3061 msgid "Linking item does not exist in the system." msgstr "リンク先アイテムがシステムに存在しません。" -#: weko_search_ui/utils.py:3028 +#: weko_search_ui/utils.py:3064 msgid "Linking item already deleted in the system." msgstr "リンク先アイテムは削除済です。" -#: weko_search_ui/utils.py:3067 +#: weko_search_ui/utils.py:3103 msgid "It is not allowed to create links to the item itself." msgstr "自身へのアイテムリンクを作成することはできません。" -#: weko_search_ui/utils.py:3072 +#: weko_search_ui/utils.py:3108 +#, python-brace-format msgid "It is not allowed to create links other than {} between split items." msgstr "分割したアイテム間で{}以外のリンクを作成することはできません。" -#: weko_search_ui/utils.py:3108 +#: weko_search_ui/utils.py:3144 msgid "Duplicate Item Link." 
msgstr "重複するアイテムリンクを作成することはできません。" -#: weko_search_ui/utils.py:3447 +#: weko_search_ui/utils.py:3483 +#, python-brace-format msgid "" "One of the following required values ​​has not been " "registered.
{}
" msgstr "次のいずれかの必要値が登録していません。
{}
" -#: weko_search_ui/utils.py:3452 +#: weko_search_ui/utils.py:3489 +#, python-brace-format msgid "" "The mapping of required items for DOI validation is not set. Please " "recheck the following mapping settings.
{}" msgstr "" -#: weko_search_ui/utils.py:3462 +#: weko_search_ui/utils.py:3498 +#, python-brace-format msgid "The following metadata are required.
{}" msgstr "" -#: weko_search_ui/utils.py:3467 +#: weko_search_ui/utils.py:3504 +#, python-brace-format msgid "One of the following metadata is required.
{}
" msgstr "{}は必須項目です。" -#: weko_search_ui/utils.py:3530 weko_search_ui/utils.py:3542 +#: weko_search_ui/utils.py:3567 weko_search_ui/utils.py:3579 msgid "Please specify the date with any format of YYYY-MM-DD, YYYY-MM, YYYY." msgstr "日付はYYYY-MM-DD、YYYY-MM、YYYYのいずれかで指定してください。" -#: weko_search_ui/utils.py:3536 +#: weko_search_ui/utils.py:3572 +#, python-brace-format msgid "Replace value of {} from {} to {}." msgstr "{}の値を{}から{}へ置き換えました。" -#: weko_search_ui/utils.py:3559 +#: weko_search_ui/utils.py:3595 msgid "Please specify PubDate with YYYY-MM-DD." msgstr "公開日はYYYY-MM-DDで指定してください。" -#: weko_search_ui/utils.py:3589 +#: weko_search_ui/utils.py:3625 msgid "ID is specified for the newly registered item. Ignore the ID and register." msgstr "新規登録アイテムにIDが指定されています。IDを無視して登録を行います。" -#: weko_search_ui/utils.py:3672 +#: weko_search_ui/utils.py:3708 msgid "Please specify Open Access Date with YYYY-MM-DD." msgstr "オープンアクセスの日付はYYYY-MM-DDで指定してください。" -#: weko_search_ui/utils.py:3909 weko_search_ui/utils.py:4055 -#: weko_search_ui/utils.py:4061 +#: weko_search_ui/utils.py:3945 weko_search_ui/utils.py:4091 +#: weko_search_ui/utils.py:4097 msgid "Please specify DOI prefix/suffix." msgstr "DOIは prefix/suffix の形式で指定して下さい。" -#: weko_search_ui/utils.py:4047 +#: weko_search_ui/utils.py:4083 msgid "The specified DOI is wrong and fixed with the registered DOI." msgstr "" -#: weko_search_ui/utils.py:4050 +#: weko_search_ui/utils.py:4086 msgid "" "The specified DOI RA is wrong and fixed with the correct DOI RA of the " "registered DOI." msgstr "" -#: weko_search_ui/utils.py:4057 weko_search_ui/utils.py:4063 +#: weko_search_ui/utils.py:4093 weko_search_ui/utils.py:4099 msgid "Please specify DOI suffix." msgstr "" -#: weko_search_ui/utils.py:4066 +#: weko_search_ui/utils.py:4102 msgid "Do not specify DOI suffix." msgstr "" -#: weko_search_ui/utils.py:4072 +#: weko_search_ui/utils.py:4108 msgid "Specified Prefix of DOI is incorrect." 
msgstr "" -#: weko_search_ui/utils.py:4104 +#: weko_search_ui/utils.py:4141 msgid "" "Please specify the image file(gif, jpg, jpe, jpeg, png, bmp, tiff, tif) " "for the thumbnail." msgstr "サムネイルは画像ファイル(gif, jpg, jpe, jpeg, png, bmp, tiff, tif)を指定してください。" -#: weko_search_ui/utils.py:5220 +#: weko_search_ui/utils.py:5256 +#, python-brace-format msgid "The file specified in ({}) does not exist." msgstr "({})に指定したファイルが存在しません。" -#: weko_search_ui/utils.py:5224 +#: weko_search_ui/utils.py:5261 +#, python-brace-format msgid "" "The file specified in ({}) does not exist.
The file will not be " "updated. Update only the metadata with csv/tsv contents." msgstr "({})に指定したファイルが存在しません。
ファイルの更新はしません。csv/tsv内容でメタデータのみ更新します。" -#: weko_search_ui/utils.py:5511 +#: weko_search_ui/utils.py:5547 +#, python-brace-format msgid "The file name specified in {} and {} do not match." msgstr "{}に指定されたファイル名と{}が一致しません。" diff --git a/modules/weko-search-ui/weko_search_ui/translations/messages.pot b/modules/weko-search-ui/weko_search_ui/translations/messages.pot index c0f4ceb528..dee931c764 100644 --- a/modules/weko-search-ui/weko_search_ui/translations/messages.pot +++ b/modules/weko-search-ui/weko_search_ui/translations/messages.pot @@ -9,100 +9,165 @@ msgid "" msgstr "" "Project-Id-Version: weko-search-ui 0.1.0.dev20170000\n" "Report-Msgid-Bugs-To: wekosoftware@nii.ac.jp\n" -"POT-Creation-Date: 2025-05-27 19:16+0900\n" +"POT-Creation-Date: 2025-11-12 12:12+0900\n" "PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n" "Last-Translator: FULL NAME \n" "Language-Team: LANGUAGE \n" "MIME-Version: 1.0\n" "Content-Type: text/plain; charset=utf-8\n" "Content-Transfer-Encoding: 8bit\n" -"Generated-By: Babel 2.5.1\n" +"Generated-By: Babel 2.17.0\n" -#: tests/conftest.py:399 +#: tests/conftest.py:409 msgid "write your own license" msgstr "" -#: tests/conftest.py:404 +#: tests/conftest.py:415 msgid "Creative Commons CC0 1.0 Universal Public Domain Designation" msgstr "" -#: tests/conftest.py:420 +#: tests/conftest.py:430 msgid "Creative Commons Attribution 3.0 Unported (CC BY 3.0)" msgstr "" -#: tests/conftest.py:432 +#: tests/conftest.py:443 msgid "Creative Commons Attribution-ShareAlike 3.0 Unported (CC BY-SA 3.0)" msgstr "" -#: tests/conftest.py:447 +#: tests/conftest.py:458 msgid "Creative Commons Attribution-NoDerivs 3.0 Unported (CC BY-ND 3.0)" msgstr "" -#: tests/conftest.py:461 +#: tests/conftest.py:472 msgid "Creative Commons Attribution-NonCommercial 3.0 Unported (CC BY-NC 3.0)" msgstr "" -#: tests/conftest.py:476 +#: tests/conftest.py:487 msgid "" "Creative Commons Attribution-NonCommercial-ShareAlike 3.0 Unported (CC " "BY-NC-SA 3.0)" msgstr "" -#: tests/conftest.py:491 
+#: tests/conftest.py:502 msgid "" "Creative Commons Attribution-NonCommercial-NoDerivs 3.0 Unported (CC BY-" "NC-ND 3.0)" msgstr "" -#: tests/conftest.py:507 +#: tests/conftest.py:517 msgid "Creative Commons Attribution 4.0 International (CC BY 4.0)" msgstr "" -#: tests/conftest.py:519 +#: tests/conftest.py:530 msgid "Creative Commons Attribution-ShareAlike 4.0 International (CC BY-SA 4.0)" msgstr "" -#: tests/conftest.py:534 +#: tests/conftest.py:545 msgid "" "Creative Commons Attribution-NoDerivatives 4.0 International (CC BY-ND " "4.0)" msgstr "" -#: tests/conftest.py:549 +#: tests/conftest.py:560 msgid "" "Creative Commons Attribution-NonCommercial 4.0 International (CC BY-NC " "4.0)" msgstr "" -#: tests/conftest.py:564 +#: tests/conftest.py:575 msgid "" "Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International " "(CC BY-NC-SA 4.0)" msgstr "" -#: tests/conftest.py:579 +#: tests/conftest.py:590 msgid "" "Creative Commons Attribution-NonCommercial-NoDerivatives 4.0 " "International (CC BY-NC-ND 4.0)" msgstr "" -#: weko_search_ui/admin.py:158 +#: tests/helpers.py:84 +msgid "Bagging a parent of the current directory is not supported" +msgstr "" + +#: tests/helpers.py:87 +#, python-format +msgid "Creating tag for directory %s" +msgstr "" + +#: tests/helpers.py:90 tests/helpers.py:91 +#, python-format +msgid "Bag directory %s does not exist" +msgstr "" + +#: tests/helpers.py:96 tests/helpers.py:97 +#, python-format +msgid "Bag directory %s does not contain a data directory" +msgstr "" + +#: tests/helpers.py:104 +#, python-format +msgid "" +"Unable to write to the following directories and files:\n" +"%s" +msgstr "" + +#: tests/helpers.py:107 +msgid "Missing permissions to move all files and directories" +msgstr "" + +#: tests/helpers.py:114 +#, python-format +msgid "" +"The following directories do not have read permissions:\n" +"%s" +msgstr "" + +#: tests/helpers.py:119 +#, python-format +msgid "" +"The following files do not have read 
permissions:\n" +"%s" +msgstr "" + +#: tests/helpers.py:123 +msgid "Read permissions are required to calculate file fixities" +msgstr "" + +#: tests/helpers.py:126 +msgid "Creating data directory" +msgstr "" + +#: tests/helpers.py:143 +msgid "Creating bagit.txt" +msgstr "" + +#: tests/helpers.py:148 +msgid "Creating bag-info.txt" +msgstr "" + +#: tests/helpers.py:167 +#, python-format +msgid "An error occurred creating a bag in %s" +msgstr "" + +#: weko_search_ui/admin.py:157 msgid "The following item(s) cannot be deleted." msgstr "" -#: weko_search_ui/admin.py:163 +#: weko_search_ui/admin.py:162 msgid "DOI granting item(s):" msgstr "" -#: weko_search_ui/admin.py:168 +#: weko_search_ui/admin.py:167 msgid "Editing item(s):" msgstr "" -#: weko_search_ui/admin.py:171 +#: weko_search_ui/admin.py:170 msgid "Success" msgstr "" -#: weko_search_ui/admin.py:204 +#: weko_search_ui/admin.py:203 msgid "Index Delete is in progress on another device." msgstr "" @@ -113,27 +178,27 @@ msgid "" "you want to continue deleting items that are not grant DOI?" msgstr "" -#: weko_search_ui/admin.py:216 +#: weko_search_ui/admin.py:215 msgid "Are you sure you want to delete it?" msgstr "" -#: weko_search_ui/admin.py:219 +#: weko_search_ui/admin.py:218 msgid "No such index." 
msgstr "" -#: weko_search_ui/admin.py:310 weko_search_ui/admin.py:1243 +#: weko_search_ui/admin.py:309 weko_search_ui/admin.py:1250 msgid "Custom Sort" msgstr "" -#: weko_search_ui/admin.py:312 weko_search_ui/admin.py:1234 +#: weko_search_ui/admin.py:311 weko_search_ui/admin.py:1241 msgid "Bulk Delete" msgstr "" -#: weko_search_ui/admin.py:325 +#: weko_search_ui/admin.py:324 msgid "Bulk Update" msgstr "" -#: weko_search_ui/admin.py:440 weko_search_ui/admin.py:868 +#: weko_search_ui/admin.py:439 weko_search_ui/admin.py:872 #: weko_search_ui/templates/weko_search_ui/admin/export.html:53 #: weko_search_ui/templates/weko_search_ui/admin/import.html:96 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:97 @@ -141,29 +206,29 @@ msgstr "" msgid "Internal server error" msgstr "" -#: weko_search_ui/admin.py:1225 weko_search_ui/admin.py:1242 +#: weko_search_ui/admin.py:1232 weko_search_ui/admin.py:1249 #: weko_search_ui/templates/weko_search_ui/admin/import.html:53 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:54 msgid "Index Tree" msgstr "" -#: weko_search_ui/admin.py:1233 weko_search_ui/admin.py:1251 -#: weko_search_ui/admin.py:1260 weko_search_ui/admin.py:1270 +#: weko_search_ui/admin.py:1240 weko_search_ui/admin.py:1258 +#: weko_search_ui/admin.py:1267 weko_search_ui/admin.py:1277 msgid "Items" msgstr "" -#: weko_search_ui/admin.py:1252 +#: weko_search_ui/admin.py:1259 #: weko_search_ui/templates/weko_search_ui/admin/import.html:42 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:43 msgid "Import" msgstr "" -#: weko_search_ui/admin.py:1261 +#: weko_search_ui/admin.py:1268 #: weko_search_ui/templates/weko_search_ui/admin/rocrate_import.html:42 msgid "RO-Crate Import" msgstr "" -#: weko_search_ui/admin.py:1271 +#: weko_search_ui/admin.py:1278 msgid "Bulk Export" msgstr "" @@ -171,23 +236,53 @@ msgstr "" msgid "contents" msgstr "" -#: weko_search_ui/mapper.py:1360 +#: weko_search_ui/mapper.py:1375 +#, 
python-brace-format msgid "\"{key}\" is required." msgstr "" -#: weko_search_ui/mapper.py:1381 +#: weko_search_ui/mapper.py:1396 +#, python-brace-format msgid "\"{key}\" is not in itemtype." msgstr "" -#: weko_search_ui/mapper.py:1383 +#: weko_search_ui/mapper.py:1398 +#, python-brace-format msgid "\"{key}\" is not in itemtype, did you mean \"{similar_key}\"?" msgstr "" -#: weko_search_ui/tasks.py:328 +#: weko_search_ui/mapper.py:1517 +#, python-format +msgid "" +"Cannot map to item type from json-ld; Mapping is not defined for the " +"metadata, \"%(key)s\": \"%(value)s\"" +msgstr "" + +#: weko_search_ui/mapper.py:1543 +#, python-format +msgid "" +"Cannot map to item type from json-ld; Not found mapping destination for " +"the metadata, \"%(key)s\": \"%(value)s\"" +msgstr "" + +#: weko_search_ui/mapper.py:1553 +#, python-format +msgid "Failed to set metadata for json-ld, \"%(key)s\": \"%(value)s\"" +msgstr "" + +#: weko_search_ui/mapper.py:1572 +msgid "Metadata which could not be mapped to item type will be set in 'Extra'." +msgstr "" + +#: weko_search_ui/mapper.py:1576 +msgid "Metadata which could not be mapped to item type will be discarded." +msgstr "" + +#: weko_search_ui/tasks.py:337 msgid "`wk:metadata_replace` flag cannot be used in RO-Crate Import." msgstr "" -#: weko_search_ui/tasks.py:343 +#: weko_search_ui/tasks.py:352 msgid "`wk:isSplited` flag cannot be used in RO-Crate Import." msgstr "" @@ -195,25 +290,28 @@ msgstr "" msgid "The same item may have been registered." msgstr "" -#: weko_search_ui/utils.py:592 weko_search_ui/utils.py:708 +#: weko_search_ui/utils.py:593 weko_search_ui/utils.py:709 +#, python-brace-format msgid "" "The format of the specified file {} does not support import. Please " "specify one of the following formats: zip, tar, gztar, bztar, xztar." msgstr "" -#: weko_search_ui/utils.py:600 +#: weko_search_ui/utils.py:601 +#, python-brace-format msgid "" "The csv/tsv file was not found in the specified file {}. 
Check if the " "directory structure is correct." msgstr "" -#: weko_search_ui/utils.py:649 +#: weko_search_ui/utils.py:650 msgid "" "The item type of the item to be imported is missing or has already been " "deleted." msgstr "" -#: weko_search_ui/utils.py:715 +#: weko_search_ui/utils.py:716 +#, python-brace-format msgid "" "The xml file was not found in the specified file {}. Check if the " "directory structure is correct." @@ -223,268 +321,305 @@ msgstr "" msgid "The item type ID specified in the XML file does not exist." msgstr "" -#: weko_search_ui/utils.py:1215 +#: weko_search_ui/utils.py:1206 +#, python-brace-format msgid "" "There is an error in the format of the first line of the header of the {}" " file." msgstr "" -#: weko_search_ui/utils.py:1234 +#: weko_search_ui/utils.py:1225 +#, python-brace-format msgid "The item type ID specified in the {} file does not exist." msgstr "" -#: weko_search_ui/utils.py:1243 +#: weko_search_ui/utils.py:1236 msgid "Cannot register because the specified item type is not the latest version." msgstr "" -#: weko_search_ui/utils.py:1258 +#: weko_search_ui/utils.py:1250 +#, python-brace-format msgid "The following metadata keys are duplicated.
{}" msgstr "" -#: weko_search_ui/utils.py:1281 +#: weko_search_ui/utils.py:1274 +#, python-brace-format msgid "The item does not consistent with the specified item type.
{}" msgstr "" -#: weko_search_ui/utils.py:1311 +#: weko_search_ui/utils.py:1303 +#, python-brace-format msgid "Cannot read {} file correctly." msgstr "" -#: weko_search_ui/utils.py:1331 +#: weko_search_ui/utils.py:1328 +#, python-brace-format msgid "" "The following items are not registered because they do not exist in the " "specified item type. {}" msgstr "" -#: weko_search_ui/utils.py:1341 +#: weko_search_ui/utils.py:1336 +#, python-brace-format msgid "" "The {} file could not be read. Make sure the file format is {} and that " "the file is UTF-8 encoded." msgstr "" -#: weko_search_ui/utils.py:1372 +#: weko_search_ui/utils.py:1369 msgid "" "The XML file could not be read. Make sure the file format is XML and that" " the file is UTF-8 encoded." msgstr "" -#: weko_search_ui/utils.py:1444 +#: weko_search_ui/utils.py:1441 msgid "Please specify item ID by half-width number." msgstr "" -#: weko_search_ui/utils.py:1459 +#: weko_search_ui/utils.py:1462 +#, python-format +msgid "Replace value of %(target_path)s from %(old_value)s to '%(new_value)s'." +msgstr "" + +#: weko_search_ui/utils.py:1475 msgid "Specified item type does not exist." msgstr "" -#: weko_search_ui/utils.py:1533 +#: weko_search_ui/utils.py:1481 +#, python-format +msgid "Specified %(type)s is different from existing %(existing_type)s." +msgstr "" + +#: weko_search_ui/utils.py:1556 msgid "Specified URI and system URI do not match." msgstr "" -#: weko_search_ui/utils.py:1545 +#: weko_search_ui/utils.py:1568 msgid "Item does not exist in the system." msgstr "" -#: weko_search_ui/utils.py:1552 +#: weko_search_ui/utils.py:1575 msgid "Item already DELETED in the system." msgstr "" -#: weko_search_ui/utils.py:1569 +#: weko_search_ui/utils.py:1592 msgid "Please specify either \"Keep\" or \"Upgrade\"." msgstr "" -#: weko_search_ui/utils.py:2472 +#: weko_search_ui/utils.py:2508 msgid "Title is required item." 
msgstr "" -#: weko_search_ui/utils.py:2489 +#: weko_search_ui/utils.py:2525 +#, python-brace-format msgid "{} is required item." msgstr "" -#: weko_search_ui/utils.py:2492 +#: weko_search_ui/utils.py:2528 +#, python-brace-format msgid "Please set \"public\" or \"private\" for {}." msgstr "" -#: weko_search_ui/utils.py:2533 +#: weko_search_ui/utils.py:2569 +#, python-brace-format msgid "The specified {} does not exist in system." msgstr "" -#: weko_search_ui/utils.py:2543 +#: weko_search_ui/utils.py:2579 +#, python-brace-format msgid "Specified {} does not match with existing index." msgstr "" -#: weko_search_ui/utils.py:2587 +#: weko_search_ui/utils.py:2623 msgid "Your role cannot register items in this index." msgstr "" -#: weko_search_ui/utils.py:2608 +#: weko_search_ui/utils.py:2644 msgid "Both of IndexID and POS_INDEX are not being set." msgstr "" -#: weko_search_ui/utils.py:2654 weko_search_ui/utils.py:2679 +#: weko_search_ui/utils.py:2690 weko_search_ui/utils.py:2715 +#, python-brace-format msgid "Specified {} is invalid." msgstr "" -#: weko_search_ui/utils.py:2721 weko_search_ui/utils.py:2754 -#: weko_search_ui/utils.py:2846 weko_search_ui/utils.py:2916 -#: weko_search_ui/utils.py:2920 weko_search_ui/utils.py:2942 -#: weko_search_ui/utils.py:2966 +#: weko_search_ui/utils.py:2757 weko_search_ui/utils.py:2790 +#: weko_search_ui/utils.py:2882 weko_search_ui/utils.py:2952 +#: weko_search_ui/utils.py:2956 weko_search_ui/utils.py:2978 +#: weko_search_ui/utils.py:3002 +#, python-brace-format msgid "Please specify {}." msgstr "" -#: weko_search_ui/utils.py:2724 weko_search_ui/utils.py:2923 +#: weko_search_ui/utils.py:2760 weko_search_ui/utils.py:2960 +#, python-brace-format msgid "The specified {} exceeds the maximum length." 
msgstr "" -#: weko_search_ui/utils.py:2739 weko_search_ui/utils.py:2897 -#: weko_search_ui/utils.py:2907 weko_search_ui/utils.py:2938 +#: weko_search_ui/utils.py:2775 weko_search_ui/utils.py:2933 +#: weko_search_ui/utils.py:2943 weko_search_ui/utils.py:2974 +#, python-brace-format msgid "Specified Prefix of {} is incorrect." msgstr "" -#: weko_search_ui/utils.py:2747 weko_search_ui/utils.py:2891 -#: weko_search_ui/utils.py:2900 +#: weko_search_ui/utils.py:2783 weko_search_ui/utils.py:2927 +#: weko_search_ui/utils.py:2936 +#, python-brace-format msgid "{} cannot be set." msgstr "" -#: weko_search_ui/utils.py:2756 weko_search_ui/utils.py:2760 -#: weko_search_ui/utils.py:2829 weko_search_ui/utils.py:2968 +#: weko_search_ui/utils.py:2793 weko_search_ui/utils.py:2797 +#: weko_search_ui/utils.py:2865 weko_search_ui/utils.py:3005 +#, python-brace-format msgid "Specified {} is different from existing {}." msgstr "" -#: weko_search_ui/utils.py:2780 +#: weko_search_ui/utils.py:2817 msgid "" "When assigning a DOI to an item, it must be associated with an index " "whose index status is \"Public\" and Harvest Publishing is \"Public\"." msgstr "" -#: weko_search_ui/utils.py:2785 +#: weko_search_ui/utils.py:2822 msgid "" "Since the item has a DOI, it must be associated with an index whose index" " status is \"Public\" and whose Harvest Publishing is \"Public\"." msgstr "" -#: weko_search_ui/utils.py:2796 +#: weko_search_ui/utils.py:2832 msgid "You cannot keep an item private because it has a DOI." msgstr "" -#: weko_search_ui/utils.py:2850 weko_search_ui/utils.py:4070 +#: weko_search_ui/utils.py:2887 weko_search_ui/utils.py:4106 msgid "DOI_RA should be set by one of JaLC, Crossref, DataCite, NDL JaLC." msgstr "" -#: weko_search_ui/utils.py:3001 +#: weko_search_ui/utils.py:3037 +#, python-brace-format msgid "Item Link type: '{}' is not one of {}." msgstr "" -#: weko_search_ui/utils.py:3005 +#: weko_search_ui/utils.py:3041 msgid "Please specify Item URL for item link." 
msgstr "" -#: weko_search_ui/utils.py:3019 +#: weko_search_ui/utils.py:3055 msgid "Specified Item Link URI and system URI do not match." msgstr "" -#: weko_search_ui/utils.py:3025 +#: weko_search_ui/utils.py:3061 msgid "Linking item does not exist in the system." msgstr "" -#: weko_search_ui/utils.py:3028 +#: weko_search_ui/utils.py:3064 msgid "Linking item already deleted in the system." msgstr "" -#: weko_search_ui/utils.py:3067 +#: weko_search_ui/utils.py:3103 msgid "It is not allowed to create links to the item itself." msgstr "" -#: weko_search_ui/utils.py:3072 +#: weko_search_ui/utils.py:3108 +#, python-brace-format msgid "It is not allowed to create links other than {} between split items." msgstr "" -#: weko_search_ui/utils.py:3108 +#: weko_search_ui/utils.py:3144 msgid "Duplicate Item Link." msgstr "" -#: weko_search_ui/utils.py:3447 +#: weko_search_ui/utils.py:3483 +#, python-brace-format msgid "" "One of the following required values ​​has not been " "registered.
{}
" msgstr "" -#: weko_search_ui/utils.py:3452 +#: weko_search_ui/utils.py:3489 +#, python-brace-format msgid "" "The mapping of required items for DOI validation is not set. Please " "recheck the following mapping settings.
{}" msgstr "" -#: weko_search_ui/utils.py:3462 +#: weko_search_ui/utils.py:3498 +#, python-brace-format msgid "The following metadata are required.
{}" msgstr "" -#: weko_search_ui/utils.py:3467 +#: weko_search_ui/utils.py:3504 +#, python-brace-format msgid "One of the following metadata is required.
{}
" msgstr "" -#: weko_search_ui/utils.py:3530 weko_search_ui/utils.py:3542 +#: weko_search_ui/utils.py:3567 weko_search_ui/utils.py:3579 msgid "Please specify the date with any format of YYYY-MM-DD, YYYY-MM, YYYY." msgstr "" -#: weko_search_ui/utils.py:3536 +#: weko_search_ui/utils.py:3572 +#, python-brace-format msgid "Replace value of {} from {} to {}." msgstr "" -#: weko_search_ui/utils.py:3559 +#: weko_search_ui/utils.py:3595 msgid "Please specify PubDate with YYYY-MM-DD." msgstr "" -#: weko_search_ui/utils.py:3589 +#: weko_search_ui/utils.py:3625 msgid "ID is specified for the newly registered item. Ignore the ID and register." msgstr "" -#: weko_search_ui/utils.py:3672 +#: weko_search_ui/utils.py:3708 msgid "Please specify Open Access Date with YYYY-MM-DD." msgstr "" -#: weko_search_ui/utils.py:3909 weko_search_ui/utils.py:4055 -#: weko_search_ui/utils.py:4061 +#: weko_search_ui/utils.py:3945 weko_search_ui/utils.py:4091 +#: weko_search_ui/utils.py:4097 msgid "Please specify DOI prefix/suffix." msgstr "" -#: weko_search_ui/utils.py:4047 +#: weko_search_ui/utils.py:4083 msgid "The specified DOI is wrong and fixed with the registered DOI." msgstr "" -#: weko_search_ui/utils.py:4050 +#: weko_search_ui/utils.py:4086 msgid "" "The specified DOI RA is wrong and fixed with the correct DOI RA of the " "registered DOI." msgstr "" -#: weko_search_ui/utils.py:4057 weko_search_ui/utils.py:4063 +#: weko_search_ui/utils.py:4093 weko_search_ui/utils.py:4099 msgid "Please specify DOI suffix." msgstr "" -#: weko_search_ui/utils.py:4066 +#: weko_search_ui/utils.py:4102 msgid "Do not specify DOI suffix." msgstr "" -#: weko_search_ui/utils.py:4072 +#: weko_search_ui/utils.py:4108 msgid "Specified Prefix of DOI is incorrect." msgstr "" -#: weko_search_ui/utils.py:4104 +#: weko_search_ui/utils.py:4141 msgid "" "Please specify the image file(gif, jpg, jpe, jpeg, png, bmp, tiff, tif) " "for the thumbnail." 
msgstr "" -#: weko_search_ui/utils.py:5220 +#: weko_search_ui/utils.py:5256 +#, python-brace-format msgid "The file specified in ({}) does not exist." msgstr "" -#: weko_search_ui/utils.py:5224 +#: weko_search_ui/utils.py:5261 +#, python-brace-format msgid "" "The file specified in ({}) does not exist.
The file will not be " "updated. Update only the metadata with csv/tsv contents." msgstr "" -#: weko_search_ui/utils.py:5511 +#: weko_search_ui/utils.py:5547 +#, python-brace-format msgid "The file name specified in {} and {} do not match." msgstr "" diff --git a/modules/weko-search-ui/weko_search_ui/utils.py b/modules/weko-search-ui/weko_search_ui/utils.py index e55b8064d0..3df6d0aba3 100644 --- a/modules/weko-search-ui/weko_search_ui/utils.py +++ b/modules/weko-search-ui/weko_search_ui/utils.py @@ -923,6 +923,7 @@ def check_jsonld_import_items( with open(f"{data_path}/{json_name}", "r") as f: json_ld = json.load(f) + mapper.data_path = data_path item_metadatas, _ = mapper.to_item_metadata(json_ld) list_record = [ { @@ -1432,6 +1433,7 @@ def handle_validate_item_import(list_record, schema) -> list: v2 = Draft4Validator(schema) if schema else None for record in list_record: errors = record.get("errors") or [] + warnings = [] record_id = record.get("id") if record_id and ( not represents_int(record_id) or re.search(r"([0-9])", record_id) @@ -1443,19 +1445,45 @@ def handle_validate_item_import(list_record, schema) -> list: if record.get("metadata"): if v2: a = v2.iter_errors(record.get("metadata")) + for error in a: + if ( + error.validator == "type" + and error.validator_value == "string" + and isinstance(error.instance, int) + ): + target = record["metadata"] + path_list = list(error.path) + for key in path_list[:-1]: + target = target[key] + last_key = path_list[-1] + target[last_key] = str(target[last_key]) + target_path = ".".join([str(p) for p in path_list[:-2]]) + warnings.append( + _("Replace value of %(target_path)s from %(old_value)s to '%(new_value)s'.", + target_path=target_path, old_value=target[last_key], new_value=str(target[last_key]) + ) + ) + b = v2.iter_errors(record.get("metadata")) if current_i18n.language == "ja": _errors = [] - for error in a: + for error in b: _errors.append(handle_convert_validate_msg_to_jp(error.message)) errors = errors + 
_errors else: - errors = errors + [error.message for error in a] + errors = errors + [error.message for error in b] else: errors = errors = errors + [_("Specified item type does not exist.")] - item_error = dict(**record) - item_error["errors"] = errors if len(errors) else None - result.append(item_error) + records = dict(**record) + records["errors"] = errors if len(errors) else None + if len(warnings) > 0: + warnings.append( + _("Specified %(type)s is different from existing %(existing_type)s.", + type="type:integer", existing_type="type:string" + ) + ) + records["warnings"] = warnings if len(warnings) else None + result.append(records) return result diff --git a/nginx/ams/weko-frontend/components/detail/Section.vue b/nginx/ams/weko-frontend/components/detail/Section.vue index 2e4a4cb916..3141814352 100644 --- a/nginx/ams/weko-frontend/components/detail/Section.vue +++ b/nginx/ams/weko-frontend/components/detail/Section.vue @@ -1,7 +1,7 @@