-# Java Gradle CircleCI 2.0 configuration file
-# Check https://circleci.com/docs/2.0/language-java/ for more details
-version: 2
- build:
- docker:
- # specify the version you desire here
- - image: circleci/openjdk:11-jdk
- # Specify service dependencies here if necessary
- # CircleCI maintains a library of pre-built images
- # documented at https://circleci.com/docs/2.0/circleci-images/
- # - image: circleci/postgres:9.4
- working_directory: ~/repo
- environment:
- # Customize the JVM maximum heap limit
- JVM_OPTS: -Xmx3200m
- TERM: dumb
- steps:
- - checkout
- # Download and cache dependencies
- - restore_cache:
- keys:
- - v1-dependencies-{{ checksum "build.gradle" }}
- # fallback to using the latest cache if no exact match is found
- - v1-dependencies-
- - run: ./gradlew dependencies
- - save_cache:
- paths:
- - ~/.gradle
- key: v1-dependencies-{{ checksum "build.gradle" }}
- # run tests!
- - run: ./gradlew test jacocoTestReport coveralls --no-daemon
- - store_test_results:
- path: build/reports/jacoco/test/jacocoTestReport.xml
- - store_test_results:
- path: build/reports/tests/test
- - store_artifacts:
- path: build/reports/jacoco/test/jacocoTestReport.xml
- - store_artifacts:
- path: build/reports/tests/test
- - store_artifacts:
- path: build/reports/jacoco/test/html/index.html
- - store_artifacts:
- path: build/reports/tests/test/index.html
\ No newline at end of file
id: docker_build
new file mode 100644
index 00000000..476bfa1e
--- /dev/null
+++ b/CITATION.cff
@@ -0,0 +1,54 @@
+cff-version: 1.2.0
+message: "If you use this software, please cite it as below."
+- family-names: "Foppiano"
+ given-names: "Luca"
+ orcid: "https://orcid.org/0000-0002-6114-6164"
+- family-names: "de Castro"
+ given-names: "Pedro Baptista"
+ orcid: "https://orcid.org/0000-0001-8673-2840"
+- family-names: "Ortiz Suarez"
+ given-names: "Pedro"
+ orcid: "https://orcid.org/0000-0003-0343-8852"
+- family-names: "Terashima"
+ given-names: "Kensei"
+ orcid: "https://orcid.org/0000-0003-0375-3043"
+- family-names: "Takano"
+ given-names: "Yoshihiko"
+ orcid: "https://orcid.org/0000-0002-1541-6928"
+- family-names: "Ishii"
+ given-names: "Masashi"
+ orcid: "https://orcid.org/0000-0003-0357-2832"
+title: "grobid-superconductors"
+version: 2.0.4
+url: "https://github.com/lfoppiano/grobid-superconductors"
+ type: article
+ authors:
+ - family-names: "Foppiano"
+ given-names: "Luca"
+ orcid: "https://orcid.org/0000-0002-6114-6164"
+ - family-names: "de Castro"
+ given-names: "Pedro Baptista"
+ orcid: "https://orcid.org/0000-0001-8673-2840"
+ - family-names: "Ortiz Suarez"
+ given-names: "Pedro"
+ orcid: "https://orcid.org/0000-0003-0343-8852"
+ - family-names: "Terashima"
+ given-names: "Kensei"
+ orcid: "https://orcid.org/0000-0003-0375-3043"
+ - family-names: "Takano"
+ given-names: "Yoshihiko"
+ orcid: "https://orcid.org/0000-0002-1541-6928"
+ - family-names: "Ishii"
+ given-names: "Masashi"
+ orcid: "https://orcid.org/0000-0003-0357-2832"
+ doi: "10.1080/27660400.2022.2153633"
+ journal: " Science and Technology of Advanced Materials: Methods"
+ month: 1
+# start: 1 # First page number
+# end: 10 # Last page number
+ title: "Automatic extraction of materials and properties from superconductors scientific literature"
+ issue: 1
+ volume: 3
+ year: 2023
-RUN ./gradlew downloadTransformers --no-daemon --info --stacktrace && rm -f /opt/grobid-source/grobid-home/models/*.zip
+# Preparing distribution
+WORKDIR /opt/grobid-source/grobid-superconductors_source
@@ -74,21 +65,22 @@ WORKDIR /opt
# build runtime image
# -------------------
-FROM grobid/grobid:0.7.2 as runtime
+FROM lfoppiano/grobid-quantities:0.8.0 as runtime
# setting locale is likely useless but to be sure
-# Install SO dependencies
-RUN apt-get update && \
- apt-get -y --no-install-recommends install git wget
WORKDIR /opt/grobid
-RUN mkdir -p /opt/grobid/grobid-superconductors
+RUN rm -rf /opt/grobid/grobid-quantities \
+ && rm /opt/grobid/resources \
+ && mkdir -p /opt/grobid/grobid-superconductors \
+ && rm -rf /opt/grobid/grobid-home/models/*.-with_ELMo \
+ && rm -rf /opt/grobid/grobid-service
COPY --from=builder /opt/grobid-source/grobid-home/models ./grobid-home/models
-COPY --from=builder /opt/grobid-source/grobid-superconductors/build/libs/* ./grobid-superconductors/
-COPY --from=builder /opt/grobid-source/grobid-superconductors/resources/config/config.yml ./grobid-superconductors/
+COPY --from=builder /opt/grobid-source/grobid-superconductors ./grobid-superconductors/
+COPY --from=builder /opt/grobid-source/grobid-superconductors_source/resources/config/config-docker.yml ./grobid-superconductors/resources/config/config.yml
VOLUME ["/opt/grobid/grobid-home/tmp"]
@@ -96,13 +88,6 @@ RUN pip install -U git+https://github.com/kermitt2/delft.git
WORKDIR /opt/grobid
-#RUN sed -i 's/pythonVirtualEnv:.*/pythonVirtualEnv: \/opt\/grobid\/venv/g' grobid-superconductors/config.yml
-RUN sed -i 's/pythonVirtualEnv:.*/pythonVirtualEnv: /g' grobid-superconductors/config.yml
-RUN sed -i 's/grobidHome:.*/grobidHome: grobid-home/g' grobid-superconductors/config.yml
-RUN sed -i 's/chemDataExtractorUrl:.*/chemDataExtractorUrl: ${CDE_URL:- http:\/\/cde.local:8080}/g' grobid-superconductors/config.yml
-RUN sed -i 's/linkingModuleUrl:.*/linkingModuleUrl: ${LINKING_MODULE_URL:- http:\/\/linking_module.local:8080}/g' grobid-superconductors/config.yml
-RUN sed -i 's/classResolverUrl:.*/classResolverUrl: ${LINKING_MODULE_URL:- http:\/\/linking_module.local:8080}/g' grobid-superconductors/config.yml
## Select transformers model
@@ -113,18 +98,24 @@ RUN if [[ -z "$TRANSFORMERS_MODEL" ]] ; then echo "Using Scibert as default tran
# tar -xzf /tmp/jprofiler_linux_12_0_2.tar.gz -C /usr/local &&\
# rm /tmp/jprofiler_linux_12_0_2.tar.gz
-EXPOSE 8072 8073
+WORKDIR /opt/grobid
+ENV GROBID_SUPERCONDUCTORS_OPTS "-Djava.library.path=/opt/grobid/grobid-home/lib/lin-64:/usr/local/lib/python3.8/dist-packages/jep --add-opens java.base/java.lang=ALL-UNNAMED"
+ENV LINKING_MODULE_URL "http://linking_module.local:8080"
+ENV CDE_URL "http://cde.local:8080"
+EXPOSE 8072 8073
-RUN if [ ! -f "grobid-superconductors/grobid-superconductors-${GROBID_VERSION}-onejar.jar" ]; then mv grobid-superconductors/grobid-superconductors-*-onejar.jar grobid-superconductors/grobid-superconductors-${GROBID_VERSION}-onejar.jar; fi
+# RUN if [ ! -f "grobid-superconductors/grobid-superconductors-${GROBID_VERSION}-onejar.jar" ]; then mv grobid-superconductors/grobid-superconductors-*-onejar.jar grobid-superconductors/grobid-superconductors-${GROBID_VERSION}-onejar.jar; fi
#RUN if [ "${!GROBID_VERSION}" = "unknown" ] ; then GROBID_VERSION=`ls grobid-superconductors/grobid-superconductors-*onejar.jar | grep -oE '[0-9]\.[0-9]\.[0-9](-SNAPSHOT)?' | head -n 1`; fi
#CMD ["java", "-agentlib:jdwp=transport=dt_socket,server=y,suspend=y,address=*:5005", "-jar", "grobid-superconductors/grobid-superconductors-0.5.2-SNAPSHOT-onejar.jar", "server", "grobid-superconductors/config.yml"]
#CMD ["java", "-agentpath:/usr/local/jprofiler12.0.2/bin/linux-x64/libjprofilerti.so=port=8849", "-jar", "grobid-superconductors/grobid-superconductors-0.2.1-SNAPSHOT-onejar.jar", "server", "grobid-superconductors/config.yml"]
-CMD ["sh", "-c", "java -jar grobid-superconductors/grobid-superconductors-${GROBID_VERSION}-onejar.jar server grobid-superconductors/config.yml"]
+#CMD ["sh", "-c", "java -jar grobid-superconductors/grobid-superconductors-${GROBID_VERSION}-onejar.jar server grobid-superconductors/config.yml"]
+CMD ["./grobid-superconductors/bin/grobid-superconductors", "server", "grobid-superconductors/resources/config/config.yml"]
diff --git a/README.md b/README.md
index d36f4e08..bfdb8346 100644
--- a/README.md
+++ b/README.md
@@ -1,12 +1,11 @@
-# Grobid superconductors module
+# Grobid superconductors
[![Docker Hub](https://img.shields.io/docker/pulls/lfoppiano/grobid-superconductors.svg)](https://hub.docker.com/r/lfoppiano/grobid-superconductors/ "Docker Pulls")
[![Coverage Status](https://coveralls.io/repos/github/lfoppiano/grobid-superconductors/badge.svg?branch=master)](https://coveralls.io/github/lfoppiano/grobid-superconductors?branch=master)
-[![Build unstable](https://github.com/lfoppiano/grobid-superconductors/actions/workflows/ci-build-unstable.yml/badge.svg)](https://github.com/lfoppiano/grobid-superconductors/actions/workflows/ci-build-unstable.yml)
-__Work in progress.__
+[![Demo grobid-superconductors](https://img.shields.io/website-up-down-green-red/https/lfoppiano-grobid-superconductors.hf.space.svg)](https://lfoppiano-grobid-superconductors.hf.space)
+[![Open in Spaces](https://huggingface.co/datasets/huggingface/badges/raw/main/open-in-hf-spaces-sm.svg)](https://lfoppiano-grobid-superconductors.hf.space/)
* [Introduction](#introduction)
* [Getting started](#getting-started)
@@ -419,6 +418,8 @@ Our warmest thanks to [Patrice Lopez](https://github.com/kermitt2) from [Science
This project has been developed at the [National Institute for Materials Science](http://www.nims.go.jp), in [Tsukuba](https://en.wikipedia.org/wiki/Tsukuba,_Ibaraki), Japan.
+Developed using ![JetBrains Logo (Main) logo](https://resources.jetbrains.com/storage/products/company/brand/logos/jb_beam.svg)
## License
GROBID and grobid-superconductors are distributed under [Apache 2.0 license](http://www.apache.org/licenses/LICENSE-2.0).
@@ -432,56 +433,56 @@ We described the framework around the system in the following articles (the late
- [Automatic Extraction of Materials and Properties from Superconductors Scientific Literature ](https://hal.inria.fr/hal-03776658)
- @article{doi:10.1080/27660400.2022.2153633,
- author = {Luca Foppiano and Pedro Baptista Castro and Pedro Ortiz Suarez and Kensei Terashima and Yoshihiko Takano and Masashi Ishii},
- title = {Automatic extraction of materials and properties from superconductors scientific literature},
- journal = {Science and Technology of Advanced Materials: Methods},
- volume = {3},
- number = {1},
- pages = {2153633},
- year = {2023},
- publisher = {Taylor & Francis},
- doi = {10.1080/27660400.2022.2153633},
- URL = {
- https://doi.org/10.1080/27660400.2022.2153633
- },
- eprint = {
- https://doi.org/10.1080/27660400.2022.2153633
+ @article{doi:10.1080/27660400.2022.2153633,
+ author = {Luca Foppiano and Pedro Baptista Castro and Pedro Ortiz Suarez and Kensei Terashima and Yoshihiko Takano and Masashi Ishii},
+ title = {Automatic extraction of materials and properties from superconductors scientific literature},
+ journal = {Science and Technology of Advanced Materials: Methods},
+ volume = {3},
+ number = {1},
+ pages = {2153633},
+ year = {2023},
+ publisher = {Taylor & Francis},
+ doi = {10.1080/27660400.2022.2153633},
+ URL = {
+ https://doi.org/10.1080/27660400.2022.2153633
+ },
+ eprint = {
+ https://doi.org/10.1080/27660400.2022.2153633
+ }
- }
- [SuperMat](http://github.com/lfoppiano/Supermat): construction of a linked annotated dataset from superconductors-related publications
- @article{doi:10.1080/27660400.2021.1918396,
- author = {Luca Foppiano and Sae Dieb and Akira Suzuki and Pedro Baptista de Castro and Suguru Iwasaki and Azusa Uzuki and Miren Garbine Esparza Echevarria and Yan Meng and Kensei Terashima and Laurent Romary and Yoshihiko Takano and Masashi Ishii},
- title = {SuperMat: construction of a linked annotated dataset from superconductors-related publications},
- journal = {Science and Technology of Advanced Materials: Methods},
- volume = {1},
- number = {1},
- pages = {34-44},
- year = {2021},
- publisher = {Taylor & Francis},
- doi = {10.1080/27660400.2021.1918396},
- URL = { https://doi.org/10.1080/27660400.2021.1918396 },
- eprint = { https://doi.org/10.1080/27660400.2021.1918396 }
- }
+ @article{doi:10.1080/27660400.2021.1918396,
+ author = {Luca Foppiano and Sae Dieb and Akira Suzuki and Pedro Baptista de Castro and Suguru Iwasaki and Azusa Uzuki and Miren Garbine Esparza Echevarria and Yan Meng and Kensei Terashima and Laurent Romary and Yoshihiko Takano and Masashi Ishii},
+ title = {SuperMat: construction of a linked annotated dataset from superconductors-related publications},
+ journal = {Science and Technology of Advanced Materials: Methods},
+ volume = {1},
+ number = {1},
+ pages = {34-44},
+ year = {2021},
+ publisher = {Taylor & Francis},
+ doi = {10.1080/27660400.2021.1918396},
+ URL = { https://doi.org/10.1080/27660400.2021.1918396 },
+ eprint = { https://doi.org/10.1080/27660400.2021.1918396 }
+ }
- "Proposal for Automatic Extraction of Superconductors properties from scientific literature": [PDF](http://pubman.nims.go.jp/pubman/faces/viewItemOverviewPage.jsp?itemId=escidoc:1890245:3)
- @inproceedings{foppiano2019proposal,
- address = {Tsukuba},
- title = {Proposal for {Automatic} {Extraction} {Framework} of {Superconductors} {Related} {Information} from {Scientific} {Literature}},
- volume = {119},
- copyright = {All rights reserved},
- abstract = {The automatic collection of materials information from research papers using Natural Language Processing (NLP) is highly required for rapid materials development using big data, namely materials informatics (MI). The difficulty of this automatic collection is mainly caused by the variety of expressions in the papers, a robust system with tolerance to such variety is required to be developed. In this paper, we report an ongoing interdisciplinary work to construct a system for automatic collection of superconductor-related information from scientific literature using text mining techniques. We focused on the identification of superconducting material names and their critical temperature (Tc) key property. We discuss the construction of a prototype for extraction and linking using machine learning (ML) techniques for the physical information collection. From the evaluation using 500 sample documents, we define a baseline and a direction for future improvements.},
- language = {eng},
- booktitle = {Letters and {Technology} {News}, vol. 119, no. 66, {SC}2019-1 (no.66)},
- author = {Foppiano, Luca and Thaer, M. Dieb and Suzuki, Akira and Ishii, Masashi},
- month = may,
- year = {2019},
- note = {ISSN: 2432-6380},
- pages = {1--5}
- }
+ @inproceedings{foppiano2019proposal,
+ address = {Tsukuba},
+ title = {Proposal for {Automatic} {Extraction} {Framework} of {Superconductors} {Related} {Information} from {Scientific} {Literature}},
+ volume = {119},
+ copyright = {All rights reserved},
+ abstract = {The automatic collection of materials information from research papers using Natural Language Processing (NLP) is highly required for rapid materials development using big data, namely materials informatics (MI). The difficulty of this automatic collection is mainly caused by the variety of expressions in the papers, a robust system with tolerance to such variety is required to be developed. In this paper, we report an ongoing interdisciplinary work to construct a system for automatic collection of superconductor-related information from scientific literature using text mining techniques. We focused on the identification of superconducting material names and their critical temperature (Tc) key property. We discuss the construction of a prototype for extraction and linking using machine learning (ML) techniques for the physical information collection. From the evaluation using 500 sample documents, we define a baseline and a direction for future improvements.},
+ language = {eng},
+ booktitle = {Letters and {Technology} {News}, vol. 119, no. 66, {SC}2019-1 (no.66)},
+ author = {Foppiano, Luca and Thaer, M. Dieb and Suzuki, Akira and Ishii, Masashi},
+ month = may,
+ year = {2019},
+ note = {ISSN: 2432-6380},
+ pages = {1--5}
+ }
diff --git a/build.gradle b/build.gradle
index f70fed0e..2e60fd45 100644
--- a/build.gradle
+++ b/build.gradle
@@ -1,3 +1,5 @@
+import org.apache.tools.ant.taskdefs.condition.Os
buildscript {
repositories {
@@ -19,9 +21,10 @@ plugins {
id 'maven-publish'
id 'com.github.johnrengelman.shadow' version '7.0.0'
id "de.undercouch.download" version "4.1.1"
- id 'com.github.kt3k.coveralls' version '2.12.0'
+ id 'com.github.kt3k.coveralls' version '2.12.2'
id 'com.palantir.git-version' version '0.12.3'
id 'net.researchgate.release' version '3.0.2'
+ id "org.jetbrains.kotlin.jvm" version "1.8.21"
@@ -44,9 +47,12 @@ description = """Grobid module for extraction of superconductor information from
dependencies {
- testImplementation(platform('org.junit:junit-bom:5.8.1'))
+ testImplementation(platform('org.junit:junit-bom:5.10.2'))
+ testRuntimeOnly("org.junit.platform:junit-platform-launcher") {
+ because("Only needed to run tests in a version of IntelliJ IDEA that bundles older versions")
+ }
+ testRuntimeOnly("org.junit.jupiter:junit-jupiter-engine")
- testImplementation("junit:junit:4.13.2")
testRuntimeOnly("org.junit.vintage:junit-vintage-engine") {
because 'allows JUnit 3 and JUnit 4 tests to run'
@@ -54,16 +60,19 @@ dependencies {
testRuntimeOnly("org.junit.platform:junit-platform-launcher") {
because 'allows tests to run from IDEs that bundle older version of launcher'
- testImplementation 'org.easymock:easymock:4.3'
+ testImplementation 'org.easymock:easymock:5.2.0'
+ testImplementation 'org.hamcrest:hamcrest-all:1.3'
testImplementation 'org.hamcrest:hamcrest-library:2.2'
testImplementation 'org.powermock:powermock-module-junit4:2.0.9'
testImplementation 'org.powermock:powermock-api-easymock:2.0.9'
+ testImplementation 'org.jetbrains.kotlin:kotlin-test'
+ testImplementation "io.mockk:mockk:1.13.9"
//GROBID and grobid-quantities
- implementation 'com.github.kermitt2:grobid-quantities:0.7.2'
- implementation 'org.grobid:grobid-core:0.7.2'
- implementation 'org.grobid:grobid-trainer:0.7.2'
- implementation 'org.grobid:grobid-service:0.7.2'
+ implementation 'org.grobid:grobid-quantities:0.8.0'
+ implementation 'org.grobid:grobid-core:0.8.0'
+ implementation 'org.grobid:grobid-trainer:0.8.0'
+ implementation 'org.grobid:grobid-service:0.8.0'
implementation "xerces:xercesImpl:2.12.0"
implementation "net.arnx:jsonic:1.3.10"
implementation "net.sf.saxon:Saxon-HE:9.6.0-9"
@@ -83,25 +92,36 @@ dependencies {
implementation 'org.apache.commons:commons-text:1.10.0'
- implementation "io.dropwizard:dropwizard-core:1.3.29"
- implementation 'io.dropwizard:dropwizard-jersey:1.3.29'
- implementation "io.dropwizard:dropwizard-assets:1.3.29"
- implementation "com.hubspot.dropwizard:dropwizard-guicier:"
- implementation "io.dropwizard:dropwizard-testing:1.3.29"
- implementation "io.dropwizard:dropwizard-forms:1.3.29"
- implementation "io.dropwizard:dropwizard-client:1.3.29"
- implementation "io.dropwizard:dropwizard-auth:1.3.29"
- implementation "io.dropwizard.metrics:metrics-core:4.0.0"
- implementation "io.dropwizard.metrics:metrics-servlets:4.0.0"
+ implementation 'ru.vyarus:dropwizard-guicey:7.0.0'
+ implementation 'io.dropwizard:dropwizard-bom:4.0.0'
+ implementation 'io.dropwizard:dropwizard-core:4.0.0'
+ implementation 'io.dropwizard:dropwizard-assets:4.0.0'
+ implementation 'io.dropwizard:dropwizard-testing:4.0.0'
+ implementation 'io.dropwizard:dropwizard-forms:4.0.0'
+ implementation 'io.dropwizard:dropwizard-client:4.0.0'
+ implementation 'io.dropwizard:dropwizard-auth:4.0.0'
+ implementation 'io.dropwizard.metrics:metrics-core:4.2.22'
+ implementation 'io.dropwizard.metrics:metrics-servlets:4.2.22'
- implementation 'com.google.guava:guava:31.1-jre'
+ implementation 'com.google.guava:guava:30.1.1-jre'
implementation 'org.apache.httpcomponents:httpmime:4.5.13'
implementation 'javax.activation:activation:1.1.1'
implementation 'javax.xml.bind:jaxb-api:2.4.0-b180830.0359'
implementation 'com.sun.xml.bind:jaxb-core:4.0.1'
implementation 'com.sun.xml.bind:jaxb-impl:4.0.1'
implementation 'com.fasterxml.jackson.datatype:jackson-datatype-guava:2.13.4'
+ //Grobid-quantities
+ implementation 'tech.units:indriya:2.1.3'
+ implementation group: 'si.uom', name: 'si-units', version: '2.1'
+ implementation group: 'si.uom', name: 'si-quantity', version: '2.1'
+ implementation group: 'systems.uom', name: 'systems-quantity', version: '2.1'
+ implementation group: 'systems.uom', name: 'systems-common', version: '2.1'
+ implementation group: 'systems.uom', name: 'systems-unicode', version: '2.1'
+ implementation group: 'systems.uom', name: 'systems-ucum', version: '2.1'
+ implementation group: 'systems.uom', name: 'systems-unicode', version: '2.1'
implementation 'org.dkpro.statistics:dkpro-statistics:2.2.1'
implementation 'org.dkpro.statistics:dkpro-statistics-agreement:2.2.1'
@@ -125,9 +145,6 @@ configurations.all {
/** Other configuration **/
-sourceCompatibility = 1.8
-targetCompatibility = 1.8
tasks.withType(JavaCompile) {
options.encoding = 'UTF-8'
// options.compilerArgs << "-Xlint:deprecation"
@@ -137,9 +154,40 @@ tasks.withType(JavaCompile) {
sourceSets.main.resources {
srcDirs = ["src/main/resources", "resources/config"]
+sourceSets.test.resources {
+ srcDirs = ["src/test/resources"]
test {
exclude '**/**IntegrationTest**'
+ useJUnitPlatform()
+ maxHeapSize = "1024m"
+ def libraries = ""
+ if (Os.isFamily(Os.FAMILY_MAC)) {
+ if (Os.isArch("aarch64")) {
+ libraries = "${file("./grobid-home/lib/mac_arm-64").absolutePath}"
+ } else {
+ libraries = "${file("./grobid-home/lib/mac-64").absolutePath}"
+ }
+ } else if (Os.isFamily(Os.FAMILY_UNIX)) {
+ def jepDir = rootProject.rootDir.getAbsolutePath() + "/grobid-home/lib/lin-64/jep"
+ libraries = jepDir
+ jepDir = rootProject.rootDir.getAbsolutePath() + "/grobid-home/lib/lin-64"
+ libraries += ":" + jepDir
+ } else {
+ throw new RuntimeException("Unsupported platform!")
+ }
+ if (JavaVersion.current().compareTo(JavaVersion.VERSION_1_8) > 0) {
+ jvmArgs "--add-opens", "java.base/java.util.stream=ALL-UNNAMED",
+ "--add-opens", "java.base/java.io=ALL-UNNAMED",
+ "--add-opens", "java.base/java.lang=ALL-UNNAMED",
+ "--add-opens", "java.base/java.util.regex=ALL-UNNAMED",
+ "--add-opens", "java.base/java.math=ALL-UNNAMED",
+ "--add-opens", "java.base/java.text=ALL-UNNAMED"
+ }
+ systemProperty "java.library.path", "${System.getProperty('java.library.path')}:" + libraries
tasks.run.workingDir = rootProject.rootDir
@@ -148,6 +196,60 @@ mainClassName = 'org.grobid.service.GrobidSuperconductorsApplication'
run {
args = ['server', 'resources/config/config.yml']
+ def libraries = ""
+ if (Os.isFamily(Os.FAMILY_MAC)) {
+ if (Os.isArch("aarch64")) {
+ libraries = "${file("../grobid-home/lib/mac_arm-64").absolutePath}"
+ } else {
+ libraries = "${file("../grobid-home/lib/mac-64").absolutePath}"
+ }
+ } else if (Os.isFamily(Os.FAMILY_UNIX)) {
+ libraries = "${file("../grobid-home/lib/lin-64/jep").absolutePath}:" +
+ "${file("../grobid-home/lib/lin-64").absolutePath}:"
+ } else {
+ throw new RuntimeException("Unsupported platform!")
+ }
+ if (JavaVersion.current().compareTo(JavaVersion.VERSION_1_8) > 0) {
+ jvmArgs "--add-opens", "java.base/java.lang=ALL-UNNAMED"
+ }
+ workingDir = rootProject.rootDir
+ def javaLibraryPath = "${System.getProperty('java.library.path')}:" + libraries
+ systemProperty "java.library.path", javaLibraryPath
+task integration(type: Test) {
+ include '**'
+ maxHeapSize = "1024m"
+ def libraries = ""
+ if (Os.isFamily(Os.FAMILY_MAC)) {
+ if (Os.isArch("aarch64")) {
+ libraries = "${file("./grobid-home/lib/mac_arm-64").absolutePath}"
+ } else {
+ libraries = "${file("./grobid-home/lib/mac-64").absolutePath}"
+ }
+ } else if (Os.isFamily(Os.FAMILY_UNIX)) {
+ def jepDir = rootProject.rootDir.getAbsolutePath() + "/grobid-home/lib/lin-64/jep"
+ libraries = jepDir
+ jepDir = rootProject.rootDir.getAbsolutePath() + "/grobid-home/lib/lin-64"
+ libraries += ":" + jepDir
+ } else {
+ throw new RuntimeException("Unsupported platform!")
+ }
+ if (JavaVersion.current().compareTo(JavaVersion.VERSION_1_8) > 0) {
+ jvmArgs "--add-opens", "java.base/java.util.stream=ALL-UNNAMED",
+ "--add-opens", "java.base/java.io=ALL-UNNAMED",
+ "--add-opens", "java.base/java.lang=ALL-UNNAMED",
+ "--add-opens", "java.base/java.util.regex=ALL-UNNAMED",
+ "--add-opens", "java.base/java.math=ALL-UNNAMED",
+ "--add-opens", "java.base/java.text=ALL-UNNAMED"
+ }
+ systemProperty "java.library.path", "${System.getProperty('java.library.path')}:" + libraries
@@ -201,18 +303,14 @@ shadowJar {
jar {
- enabled false
+ enabled true
artifacts {
archives shadowJar
-// archives jar
-//distZip.archiveClassifier = 'application'
-//distTar.archiveClassifier = 'application'
-distZip.enabled = false
+distZip.enabled = true
distTar.enabled = false
shadowDistZip.enabled = false
shadowDistTar.enabled = false
@@ -230,6 +328,9 @@ publishing {
def conf = new org.yaml.snakeyaml.Yaml().load( new File("resources/config/config.yml").newInputStream() )
def grobidHome = conf.grobidHome.replace("\$", "").replace('{', "").replace("GROBID_HOME:- ", "").replace("}", "")
+if (grobidHome.startsWith("../")) {
+ grobidHome = "${rootProject.rootDir}/${grobidHome}"
/** Model management **/
@@ -244,29 +345,44 @@ task copyModels(type: Copy) {
include "**/preprocessor.json"
exclude "**/features-engineering/**"
exclude "**/result-logs/**"
- into "${rootDir}/${grobidHome}/models/"
+ into "${grobidHome}/models/"
doLast {
print "Copy models under grobid-home: ${grobidHome}"
- ant.gunzip(src: "${rootDir}/${grobidHome}/models/superconductors/model.wapiti.gz", dest: "${rootDir}/${grobidHome}/models/superconductors/")
+ ant.gunzip(src: "${grobidHome}/models/superconductors/model.wapiti.gz", dest: "${grobidHome}/models/superconductors/")
-task downloadTransformers(dependsOn: copyModels) {
+task downloadTransformersQuantities(dependsOn: copyModels) {
doLast {
download {
- src "https://kdrive.infomaniak.com/2/app/104844/share/0f902484-a529-4562-96d7-364959f364dd/files/150668/download"
- dest "${rootDir}/${grobidHome}/models/superconductors-transformers.zip"
+ src "https://transformers-data.s3.eu-central-1.amazonaws.com/quantities-transformers-240226.zip"
+ dest "${grobidHome}/models/quantities-transformers.zip"
overwrite false
print "Download bulky transformers files under grobid-home: ${grobidHome}"
- ant.unzip(src: "${rootDir}/${grobidHome}/models/superconductors-transformers.zip", dest: "${rootDir}/${grobidHome}/models/")
+ ant.unzip(src: "${grobidHome}/models/quantities-transformers.zip", dest: "${grobidHome}/models/")
+task downloadTransformers(dependsOn: copyModels) {
+ doLast {
+ download {
+ src "https://transformers-data.s3.eu-central-1.amazonaws.com/superconductors-transformers-230222.zip"
+ dest "${grobidHome}/models/superconductors-transformers.zip"
+ overwrite false
+ print "Download bulky transformers files under grobid-home: ${grobidHome}"
+ }
+ ant.unzip(src: "${grobidHome}/models/superconductors-transformers.zip", dest: "${grobidHome}/models/")
+ }
wrapper {
- gradleVersion "7.1.1"
+ gradleVersion "7.2"
+test {
+ useJUnitPlatform()
jacocoTestReport {
@@ -289,5 +405,3 @@ release {
diff --git a/docker-compose.yml b/docker-compose.yml
index eb22ca36..1a08c821 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -11,7 +11,7 @@ services:
- "cde.local"
- image: lfoppiano/grobid-superconductors-tools:2.1
+ image: lfoppiano/material-parsers:3.0.1
restart: always
- 8090:8080
@@ -27,7 +27,7 @@ services:
- image: lfoppiano/grobid-superconductors:0.5.0
+ image: lfoppiano/grobid-superconductors:0.5.3
- ./resources/config/config-docker.yml:/opt/grobid/grobid-superconductors/config.yml:ro
# - /Users/lfoppiano/development/projects/grobid/grobid-superconductors/resources/config/grobid.yaml:/opt/grobid/grobid-home/config/grobid.yaml:ro
diff --git a/gradle.properties b/gradle.properties
index bfec3755..5aef8ae5 100644
--- a/gradle.properties
+++ b/gradle.properties
@@ -1,7 +1,8 @@
org.gradle.caching = true
org.gradle.parallel = true
org.gradle.vfs.watch = true
diff --git a/gradle/wrapper/gradle-wrapper.properties b/gradle/wrapper/gradle-wrapper.properties
index 05679dc3..ffed3a25 100644
--- a/gradle/wrapper/gradle-wrapper.properties
+++ b/gradle/wrapper/gradle-wrapper.properties
@@ -1,5 +1,5 @@
diff --git a/gradlew b/gradlew
index 4f906e0c..1b6c7873 100755
--- a/gradlew
+++ b/gradlew
@@ -1,7 +1,7 @@
-#!/usr/bin/env sh
-# Copyright 2015 the original author or authors.
+# Copyright © 2015-2021 the original authors.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
@@ -17,67 +17,101 @@
-## Gradle start up script for UN*X
+# Gradle start up script for POSIX generated by Gradle.
+# Important for running:
+# (1) You need a POSIX-compliant shell to run this script. If your /bin/sh is
+# noncompliant, but you have some other compliant shell such as ksh or
+# bash, then to run this script, type that shell name before the whole
+# command line, like:
+# ksh Gradle
+# Busybox and similar reduced shells will NOT work, because this script
+# requires all of these POSIX shell features:
+# * functions;
+# * expansions «$var», «${var}», «${var:-default}», «${var+SET}»,
+# «${var#prefix}», «${var%suffix}», and «$( cmd )»;
+# * compound commands having a testable exit status, especially «case»;
+# * various built-in commands including «command», «set», and «ulimit».
+# Important for patching:
+# (2) This script targets any POSIX shell, so it avoids extensions provided
+# by Bash, Ksh, etc; in particular arrays are avoided.
+# The "traditional" practice of packing multiple parameters into a
+# space-separated string is a well documented source of bugs and security
+# problems, so this is (mostly) avoided, by progressively accumulating
+# options in "$@", and eventually passing that to Java.
+# Where the inherited environment variables (DEFAULT_JVM_OPTS, JAVA_OPTS,
+# and GRADLE_OPTS) rely on word-splitting, this is performed explicitly;
+# see the in-line comments for details.
+# There are tweaks for specific operating systems such as AIX, CygWin,
+# Darwin, MinGW, and NonStop.
+# (3) This script is generated from the Groovy template
+# https://github.com/gradle/gradle/blob/master/subprojects/plugins/src/main/resources/org/gradle/api/internal/plugins/unixStartScript.txt
+# within the Gradle project.
+# You can find Gradle at https://github.com/gradle/gradle/.
# Attempt to set APP_HOME
# Resolve links: $0 may be a link
-# Need this for relative symlinks.
-while [ -h "$PRG" ] ; do
- ls=`ls -ld "$PRG"`
- link=`expr "$ls" : '.*-> \(.*\)$'`
- if expr "$link" : '/.*' > /dev/null; then
- PRG="$link"
- else
- PRG=`dirname "$PRG"`"/$link"
- fi
+# Need this for daisy-chained symlinks.
+ APP_HOME=${app_path%"${app_path##*/}"} # leaves a trailing /; empty if no leading path
+ [ -h "$app_path" ]
+ ls=$( ls -ld "$app_path" )
+ link=${ls#*' -> '}
+ case $link in #(
+ /*) app_path=$link ;; #(
+ *) app_path=$APP_HOME$link ;;
+ esac
-cd "`dirname \"$PRG\"`/" >/dev/null
-APP_HOME="`pwd -P`"
-cd "$SAVED" >/dev/null
+APP_HOME=$( cd "${APP_HOME:-./}" && pwd -P ) || exit
-APP_BASE_NAME=`basename "$0"`
# Add default JVM options here. You can also use JAVA_OPTS and GRADLE_OPTS to pass JVM options to this script.
DEFAULT_JVM_OPTS='"-Xmx64m" "-Xms64m"'
# Use the maximum available, or set MAX_FD != -1 to use that value.
warn () {
echo "$*"
+} >&2
die () {
echo "$*"
exit 1
+} >&2
# OS specific support (must be 'true' or 'false').
-case "`uname`" in
- cygwin=true
- ;;
- Darwin* )
- darwin=true
- ;;
- MINGW* )
- msys=true
- ;;
- nonstop=true
- ;;
+case "$( uname )" in #(
+ CYGWIN* ) cygwin=true ;; #(
+ Darwin* ) darwin=true ;; #(
+ MSYS* | MINGW* ) msys=true ;; #(
+ NONSTOP* ) nonstop=true ;;
@@ -87,9 +121,9 @@ CLASSPATH=$APP_HOME/gradle/wrapper/gradle-wrapper.jar
if [ -n "$JAVA_HOME" ] ; then
if [ -x "$JAVA_HOME/jre/sh/java" ] ; then
# IBM's JDK on AIX uses strange locations for the executables
- JAVACMD="$JAVA_HOME/jre/sh/java"
+ JAVACMD=$JAVA_HOME/jre/sh/java
- JAVACMD="$JAVA_HOME/bin/java"
if [ ! -x "$JAVACMD" ] ; then
die "ERROR: JAVA_HOME is set to an invalid directory: $JAVA_HOME
@@ -98,7 +132,7 @@ Please set the JAVA_HOME variable in your environment to match the
location of your Java installation."
- JAVACMD="java"
+ JAVACMD=java
which java >/dev/null 2>&1 || die "ERROR: JAVA_HOME is not set and no 'java' command could be found in your PATH.
Please set the JAVA_HOME variable in your environment to match the
@@ -106,80 +140,95 @@ location of your Java installation."
# Increase the maximum file descriptors if we can.
-if [ "$cygwin" = "false" -a "$darwin" = "false" -a "$nonstop" = "false" ] ; then
- MAX_FD_LIMIT=`ulimit -H -n`
- if [ $? -eq 0 ] ; then
- if [ "$MAX_FD" = "maximum" -o "$MAX_FD" = "max" ] ; then
- fi
- ulimit -n $MAX_FD
- if [ $? -ne 0 ] ; then
- warn "Could not set maximum file descriptor limit: $MAX_FD"
- fi
- else
- warn "Could not query maximum file descriptor limit: $MAX_FD_LIMIT"
- fi
+if ! "$cygwin" && ! "$darwin" && ! "$nonstop" ; then
+ case $MAX_FD in #(
+ max*)
+ MAX_FD=$( ulimit -H -n ) ||
+ warn "Could not query maximum file descriptor limit"
+ esac
+ case $MAX_FD in #(
+ '' | soft) :;; #(
+ *)
+ ulimit -n "$MAX_FD" ||
+ warn "Could not set maximum file descriptor limit to $MAX_FD"
+ esac
-# For Darwin, add options to specify how the application appears in the dock
-if $darwin; then
- GRADLE_OPTS="$GRADLE_OPTS \"-Xdock:name=$APP_NAME\" \"-Xdock:icon=$APP_HOME/media/gradle.icns\""
+# Collect all arguments for the java command, stacking in reverse order:
+# * args from the command line
+# * the main class name
+# * -classpath
+# * -D...appname settings
+# * --module-path (only if needed)
+# * DEFAULT_JVM_OPTS, JAVA_OPTS, and GRADLE_OPTS environment variables.
# For Cygwin or MSYS, switch paths to Windows format before running java
-if [ "$cygwin" = "true" -o "$msys" = "true" ] ; then
- APP_HOME=`cygpath --path --mixed "$APP_HOME"`
- CLASSPATH=`cygpath --path --mixed "$CLASSPATH"`
- JAVACMD=`cygpath --unix "$JAVACMD"`
- # We build the pattern for arguments to be converted via cygpath
- ROOTDIRSRAW=`find -L / -maxdepth 1 -mindepth 1 -type d 2>/dev/null`
- SEP=""
- for dir in $ROOTDIRSRAW ; do
- SEP="|"
- done
- # Add a user-defined pattern to the cygpath arguments
- if [ "$GRADLE_CYGPATTERN" != "" ] ; then
- fi
+if "$cygwin" || "$msys" ; then
+ APP_HOME=$( cygpath --path --mixed "$APP_HOME" )
+ CLASSPATH=$( cygpath --path --mixed "$CLASSPATH" )
+ JAVACMD=$( cygpath --unix "$JAVACMD" )
# Now convert the arguments - kludge to limit ourselves to /bin/sh
- i=0
- for arg in "$@" ; do
- CHECK=`echo "$arg"|egrep -c "$OURCYGPATTERN" -`
- CHECK2=`echo "$arg"|egrep -c "^-"` ### Determine if an option
- if [ $CHECK -ne 0 ] && [ $CHECK2 -eq 0 ] ; then ### Added a condition
- eval `echo args$i`=`cygpath --path --ignore --mixed "$arg"`
- else
- eval `echo args$i`="\"$arg\""
+ for arg do
+ if
+ case $arg in #(
+ -*) false ;; # don't mess with options #(
+ /?*) t=${arg#/} t=/${t%%/*} # looks like a POSIX filepath
+ [ -e "$t" ] ;; #(
+ *) false ;;
+ esac
+ then
+ arg=$( cygpath --path --ignore --mixed "$arg" )
- i=`expr $i + 1`
+ # Roll the args list around exactly as many times as the number of
+ # args, so each arg winds up back in the position where it started, but
+ # possibly modified.
+ #
+ # NB: a `for` loop captures its iteration list before it begins, so
+ # changing the positional parameters here affects neither the number of
+ # iterations, nor the values presented in `arg`.
+ shift # remove old arg
+ set -- "$@" "$arg" # push replacement arg
- case $i in
- 0) set -- ;;
- 1) set -- "$args0" ;;
- 2) set -- "$args0" "$args1" ;;
- 3) set -- "$args0" "$args1" "$args2" ;;
- 4) set -- "$args0" "$args1" "$args2" "$args3" ;;
- 5) set -- "$args0" "$args1" "$args2" "$args3" "$args4" ;;
- 6) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" ;;
- 7) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" ;;
- 8) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" ;;
- 9) set -- "$args0" "$args1" "$args2" "$args3" "$args4" "$args5" "$args6" "$args7" "$args8" ;;
- esac
-# Escape application args
-save () {
- for i do printf %s\\n "$i" | sed "s/'/'\\\\''/g;1s/^/'/;\$s/\$/' \\\\/" ; done
- echo " "
-APP_ARGS=`save "$@"`
+# Collect all arguments for the java command;
+# * $DEFAULT_JVM_OPTS, $JAVA_OPTS, and $GRADLE_OPTS can contain fragments of
+# shell script including quotes and variable substitutions, so put them in
+# double quotes to make sure that they get re-expanded; and
+# * put everything else in single quotes, so that it's not re-expanded.
+set -- \
+ "-Dorg.gradle.appname=$APP_BASE_NAME" \
+ -classpath "$CLASSPATH" \
+ org.gradle.wrapper.GradleWrapperMain \
+ "$@"
+# Use "xargs" to parse quoted args.
+# With -n1 it outputs one arg per line, with the quotes and backslashes removed.
+# In Bash we could simply go:
+# readarray ARGS < <( xargs -n1 <<<"$var" ) &&
+# set -- "${ARGS[@]}" "$@"
+# but POSIX shell has neither arrays nor command substitution, so instead we
+# post-process each arg (as a line of input to sed) to backslash-escape any
+# character that might be a shell metacharacter, then use eval to reverse
+# that process (while maintaining the separation between arguments), and wrap
+# the whole thing up as a single "set" statement.
+# This will of course break if any of these variables contains a newline or
+# an unmatched quote.
-# Collect all arguments for the java command, following the shell quoting and substitution rules
-eval set -- $DEFAULT_JVM_OPTS $JAVA_OPTS $GRADLE_OPTS "\"-Dorg.gradle.appname=$APP_BASE_NAME\"" -classpath "\"$CLASSPATH\"" org.gradle.wrapper.GradleWrapperMain "$APP_ARGS"
+eval "set -- $(
+ xargs -n1 |
+ sed ' s~[^-[:alnum:]+,./:=@_]~\\&~g; ' |
+ tr '\n' ' '
+ )" '"$@"'
exec "$JAVACMD" "$@"
diff --git a/resources/config/config-docker.yml b/resources/config/config-docker.yml
index 37a5ee27..336206dc 100755
--- a/resources/config/config-docker.yml
+++ b/resources/config/config-docker.yml
@@ -27,12 +27,12 @@ consolidation:
# empty value will disable the data consolidation
service: "glutton"
- url: "http://falcon.nims.go.jp/glutton"
+ url: "http://falcon.nims.go.jp/glutton/lookup"
- name: "superconductors"
- engine: "wapiti"
- # engine: "delft"
+# engine: "wapiti"
+ engine: "delft"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
@@ -41,20 +41,22 @@ models:
# deep learning parameters
# architecture: "BidLSTM_CRF"
- architecture: "scibert"
- embeddings_name: "glove-840B"
+ architecture: "BERT_CRF"
+# embeddings_name: "glove-840B"
# parameters used at runtime/prediction
- max_sequence_length: 3000
+ max_sequence_length: 512
batch_size: 4
- name: "material"
- engine: "wapiti"
+ engine: "delft"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
window: 30
nbMaxIterations: 2000
+ delft:
+ architecture: "BERT_CRF"
- name: "entityLinker-material-tcValue"
engine: "wapiti"
@@ -81,42 +83,58 @@ models:
nbMaxIterations: 2000
- name: "quantities"
- engine: "wapiti"
+ engine: "delft"
+# engine: "wapiti"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
window: 30
nbMaxIterations: 2000
+ delft:
+# architecture: "BidLSTM_CRF_FEATURES"
+ architecture: "BERT_CRF"
+ useELMo: false
+ embeddings_name: "glove-840B"
- name: "units"
- engine: "wapiti"
+ engine: "delft"
+# engine: "wapiti"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
window: 30
nbMaxIterations: 2000
+ delft:
+ architecture: "BidLSTM_CRF_FEATURES"
+ useELMo: false
+ embeddings_name: "glove-840B"
- name: "values"
- engine: "wapiti"
+ engine: "delft"
+# engine: "wapiti"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
window: 30
nbMaxIterations: 2000
+ delft:
+ architecture: "BidLSTM_CRF_FEATURES"
+ useELMo: false
+ embeddings_name: "glove-840B"
type: custom
- idleTimeout: 120 seconds
- type: http
port: 8072
+ idleTimeout: 120 seconds
- type: http
port: 8073
registerDefaultExceptionMappers: false
- level: DEBUG
+ level: WARN
# Logger-specific levels.
@@ -128,6 +146,4 @@ logging:
- type: console
threshold: INFO
-version: 2
-timeZone: UTC
+ timeZone: UTC
\ No newline at end of file
diff --git a/resources/config/config.yml b/resources/config/config.yml
index fdcd4a0c..c8520fe7 100755
--- a/resources/config/config.yml
+++ b/resources/config/config.yml
@@ -31,8 +31,8 @@ consolidation:
- name: "superconductors"
- engine: "wapiti"
-# engine: "delft"
+# engine: "wapiti"
+ engine: "delft"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
@@ -49,12 +49,14 @@ models:
batch_size: 4
- name: "material"
- engine: "wapiti"
+ engine: "delft"
# wapiti training parameters, they will be used at training time only
epsilon: 0.00001
window: 30
nbMaxIterations: 2000
+ delft:
+ architecture: "BERT_CRF"
- name: "entityLinker-material-tcValue"
engine: "wapiti"
@@ -121,10 +123,10 @@ models:
type: custom
- idleTimeout: 120 seconds
- type: http
port: 8072
+ idleTimeout: 120 seconds
- type: http
port: 8073
@@ -143,6 +145,7 @@ logging:
- type: console
threshold: INFO
+ timeZone: UTC
# The following line is used to remove the logger in the docker image, please don't modify it
- type: file
@@ -154,6 +157,3 @@ logging:
timeZone: UTC
maxFileSize: 50MB
-version: 2
-timeZone: UTC
diff --git a/resources/models/grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo/config.json b/resources/models/grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo/config.json
new file mode 100644
index 00000000..5e81a154
--- /dev/null
+++ b/resources/models/grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo/config.json
@@ -0,0 +1,91 @@
+ "model_name": "grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo",
+ "architecture": "BidLSTM_CRF_FEATURES",
+ "embeddings_name": "glove-840B",
+ "char_vocab_size": 227,
+ "case_vocab_size": 8,
+ "char_embedding_size": 25,
+ "num_char_lstm_units": 25,
+ "max_char_length": 30,
+ "features_vocabulary_size": 12,
+ "features_indices": [
+ 9,
+ 10,
+ 11,
+ 12,
+ 16,
+ 17,
+ 18,
+ 19,
+ 20,
+ 21
+ ],
+ "features_embedding_size": 4,
+ "features_lstm_units": 4,
+ "max_sequence_length": 3000,
+ "word_embedding_size": 1324,
+ "num_word_lstm_units": 100,
+ "case_embedding_size": 5,
+ "dropout": 0.5,
+ "recurrent_dropout": 0.5,
+ "use_crf": true,
+ "use_chain_crf": false,
+ "fold_number": 1,
+ "batch_size": 20,
+ "transformer_name": null,
+ "use_ELMo": true,
+ "features_map_to_index": {
+ "9": {
+ "ALLCAPS": 1,
+ "INITCAP": 2,
+ "NOCAPS": 3
+ },
+ "10": {
+ "ALLDIGIT": 13,
+ "ALLDIGITS": 14,
+ "NODIGIT": 16
+ },
+ "11": {
+ "0": 25,
+ "1": 26
+ },
+ "12": {
+ "COMMA": 37,
+ "DOT": 38,
+ "HYPHEN": 40,
+ "NOPUNCT": 41,
+ "PUNCT": 43,
+ "QUOTE": 44
+ },
+ "16": {
+ "SAMEFONT": 50,
+ "SAxMEFONT": 51
+ },
+ "17": {
+ "LOWERFONT": 62,
+ },
+ "18": {
+ "false": 73,
+ "true": 74
+ },
+ "19": {
+ "false": 85,
+ "true": 86
+ },
+ "20": {
+ "BASELINE": 97,
+ "SUBSCRIPT": 98,
+ },
+ "21": {
+ "false": 109,
+ "true": 110
+ }
+ }
\ No newline at end of file
diff --git a/resources/models/grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo/preprocessor.json b/resources/models/grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo/preprocessor.json
new file mode 100644
index 00000000..ee885822
--- /dev/null
+++ b/resources/models/grobid-superconductors-positive_sampling-all-BidLSTM_CRF_FEATURES-with_ELMo/preprocessor.json
@@ -0,0 +1,350 @@
+ "padding": true,
+ "return_lengths": true,
+ "return_word_embeddings": true,
+ "return_casing": false,
+ "return_features": true,
+ "return_chars": true,
+ "return_bert_embeddings": false,
+ "vocab_char": {
+ "": 0,
+ "": 1,
+ "!": 2,
+ "\"": 3,
+ "#": 4,
+ "$": 5,
+ "%": 6,
+ "&": 7,
+ "'": 8,
+ "(": 9,
+ ")": 10,
+ "*": 11,
+ "+": 12,
+ ",": 13,
+ "-": 14,
+ ".": 15,
+ "/": 16,
+ "0": 17,
+ "1": 18,
+ "2": 19,
+ "3": 20,
+ "4": 21,
+ "5": 22,
+ "6": 23,
+ "7": 24,
+ "8": 25,
+ "9": 26,
+ ":": 27,
+ ";": 28,
+ "<": 29,
+ "=": 30,
+ ">": 31,
+ "?": 32,
+ "@": 33,
+ "A": 34,
+ "B": 35,
+ "C": 36,
+ "D": 37,
+ "E": 38,
+ "F": 39,
+ "G": 40,
+ "H": 41,
+ "I": 42,
+ "J": 43,
+ "K": 44,
+ "L": 45,
+ "M": 46,
+ "N": 47,
+ "O": 48,
+ "P": 49,
+ "Q": 50,
+ "R": 51,
+ "S": 52,
+ "T": 53,
+ "U": 54,
+ "V": 55,
+ "W": 56,
+ "X": 57,
+ "Y": 58,
+ "Z": 59,
+ "[": 60,
+ "]": 61,
+ "_": 62,
+ "`": 63,
+ "a": 64,
+ "b": 65,
+ "c": 66,
+ "d": 67,
+ "e": 68,
+ "f": 69,
+ "g": 70,
+ "h": 71,
+ "i": 72,
+ "j": 73,
+ "k": 74,
+ "l": 75,
+ "m": 76,
+ "n": 77,
+ "o": 78,
+ "p": 79,
+ "q": 80,
+ "r": 81,
+ "s": 82,
+ "t": 83,
+ "u": 84,
+ "v": 85,
+ "w": 86,
+ "x": 87,
+ "y": 88,
+ "z": 89,
+ "{": 90,
+ "|": 91,
+ "}": 92,
+ "~": 93,
+ "\u00a9": 94,
+ "\u00ab": 95,
+ "\u00b0": 96,
+ "\u00b1": 97,
+ "\u00b4": 98,
+ "\u00b5": 99,
+ "\u00b7": 100,
+ "\u00ba": 101,
+ "\u00bb": 102,
+ "\u00bc": 103,
+ "\u00bd": 104,
+ "\u00c0": 105,
+ "\u00c2": 106,
+ "\u00c3": 107,
+ "\u00c5": 108,
+ "\u00c8": 109,
+ "\u00d0": 110,
+ "\u00d7": 111,
+ "\u00d8": 112,
+ "\u00d9": 113,
+ "\u00de": 114,
+ "\u00df": 115,
+ "\u00e1": 116,
+ "\u00e2": 117,
+ "\u00e3": 118,
+ "\u00e4": 119,
+ "\u00e8": 120,
+ "\u00e9": 121,
+ "\u00eb": 122,
+ "\u00ec": 123,
+ "\u00ee": 124,
+ "\u00f0": 125,
+ "\u00f1": 126,
+ "\u00f6": 127,
+ "\u00f8": 128,
+ "\u00fc": 129,
+ "\u00fe": 130,
+ "\u0109": 131,
+ "\u01eb": 132,
+ "\u01fa": 133,
+ "\u02da": 134,
+ "\u0351": 135,
+ "\u0352": 136,
+ "\u035e": 137,
+ "\u0393": 138,
+ "\u0394": 139,
+ "\u0398": 140,
+ "\u039b": 141,
+ "\u03a6": 142,
+ "\u03a8": 143,
+ "\u03a9": 144,
+ "\u03b1": 145,
+ "\u03b2": 146,
+ "\u03b3": 147,
+ "\u03b4": 148,
+ "\u03b5": 149,
+ "\u03b6": 150,
+ "\u03b7": 151,
+ "\u03b8": 152,
+ "\u03ba": 153,
+ "\u03bb": 154,
+ "\u03bc": 155,
+ "\u03bd": 156,
+ "\u03be": 157,
+ "\u03c0": 158,
+ "\u03c1": 159,
+ "\u03c3": 160,
+ "\u03c4": 161,
+ "\u03c6": 162,
+ "\u03c7": 163,
+ "\u03c9": 164,
+ "\u03f3": 165,
+ "\u2022": 166,
+ "\u2026": 167,
+ "\u2032": 168,
+ "\u2113": 169,
+ "\u2126": 170,
+ "\u2190": 171,
+ "\u2192": 172,
+ "\u2194": 173,
+ "\u21d4": 174,
+ "\u21e0": 175,
+ "\u2202": 176,
+ "\u2206": 177,
+ "\u2212": 178,
+ "\u221a": 179,
+ "\u221d": 180,
+ "\u221e": 181,
+ "\u222b": 182,
+ "\u223c": 183,
+ "\u2243": 184,
+ "\u2245": 185,
+ "\u2248": 186,
+ "\u2260": 187,
+ "\u2261": 188,
+ "\u2264": 189,
+ "\u2265": 190,
+ "\u226a": 191,
+ "\u226b": 192,
+ "\u2272": 193,
+ "\u22a5": 194,
+ "\u22c5": 195,
+ "\u22c6": 196,
+ "\u23a2": 197,
+ "\u2500": 198,
+ "\u25b3": 199,
+ "\uf02d": 200,
+ "\uf03c": 201,
+ "\uf03e": 202,
+ "\uf044": 203,
+ "\uf057": 204,
+ "\uf05e": 205,
+ "\uf061": 206,
+ "\uf062": 207,
+ "\uf063": 208,
+ "\uf064": 209,
+ "\uf067": 210,
+ "\uf06c": 211,
+ "\uf06d": 212,
+ "\uf070": 213,
+ "\uf072": 214,
+ "\uf073": 215,
+ "\uf077": 216,
+ "\uf0a0": 217,
+ "\uf0a3": 218,
+ "\uf0b3": 219,
+ "\uf0b4": 220,
+ "\uf0b5": 221,
+ "\uf0b6": 222,
+ "\uf0bb": 223,
+ "\uf8ef": 224,
+ "\uff05": 225,
+ "\uff0e": 226
+ },
+ "vocab_tag": {
+ "": 0,
+ "B-": 1,
+ "B-": 2,
+ "B-": 3,
+ "B-": 4,
+ "B-": 5,
+ "B-": 6,
+ "I-": 7,
+ "I-": 8,
+ "I-": 9,
+ "I-": 10,
+ "I-": 11,
+ "I-": 12,
+ "O": 13
+ },
+ "vocab_case": [
+ "",
+ "numeric",
+ "allLower",
+ "allUpper",
+ "initialUpper",
+ "other",
+ "mainly_numeric",
+ "contains_digit"
+ ],
+ "max_char_length": 30,
+ "feature_preprocessor": {
+ "features_vocabulary_size": 12,
+ "features_indices": [
+ 9,
+ 10,
+ 11,
+ 12,
+ 16,
+ 17,
+ 18,
+ 19,
+ 20,
+ 21
+ ],
+ "features_map_to_index": {
+ "9": {
+ "ALLCAPS": 1,
+ "INITCAP": 2,
+ "NOCAPS": 3
+ },
+ "10": {
+ "ALLDIGIT": 13,
+ "ALLDIGITS": 14,
+ "NODIGIT": 16
+ },
+ "11": {
+ "0": 25,
+ "1": 26
+ },
+ "12": {
+ "COMMA": 37,
+ "DOT": 38,
+ "HYPHEN": 40,
+ "NOPUNCT": 41,
+ "PUNCT": 43,
+ "QUOTE": 44
+ },
+ "16": {
+ "SAMEFONT": 50,
+ "SAxMEFONT": 51
+ },
+ "17": {
+ "LOWERFONT": 62,
+ },
+ "18": {
+ "false": 73,
+ "true": 74
+ },
+ "19": {
+ "false": 85,
+ "true": 86
+ },
+ "20": {
+ "BASELINE": 97,
+ "SUBSCRIPT": 98,
+ },
+ "21": {
+ "false": 109,
+ "true": 110
+ }
+ }
+ },
+ "indice_tag": {
+ "0": "",
+ "1": "B-",
+ "2": "B-",
+ "3": "B-",
+ "4": "B-",
+ "5": "B-",
+ "6": "B-",
+ "7": "I-",
+ "8": "I-",
+ "9": "I-",
+ "10": "I-",
+ "11": "I-",
+ "12": "I-",
+ "13": "O"
+ }
\ No newline at end of file
diff --git a/resources/models/material-BERT_CRF/preprocessor.json b/resources/models/material-BERT_CRF/preprocessor.json
new file mode 100644
index 00000000..261072bc
--- /dev/null
+++ b/resources/models/material-BERT_CRF/preprocessor.json
@@ -0,0 +1,186 @@
+ "padding": true,
+ "return_lengths": false,
+ "return_word_embeddings": false,
+ "return_casing": false,
+ "return_features": false,
+ "return_chars": false,
+ "return_bert_embeddings": true,
+ "vocab_char": {
+ "": 0,
+ "": 1,
+ "\"": 2,
+ "$": 3,
+ "%": 4,
+ "'": 5,
+ "(": 6,
+ ")": 7,
+ "*": 8,
+ "+": 9,
+ ",": 10,
+ "-": 11,
+ ".": 12,
+ "/": 13,
+ "0": 14,
+ "1": 15,
+ "2": 16,
+ "3": 17,
+ "4": 18,
+ "5": 19,
+ "6": 20,
+ "7": 21,
+ "8": 22,
+ "9": 23,
+ ":": 24,
+ ";": 25,
+ "<": 26,
+ "=": 27,
+ ">": 28,
+ "A": 29,
+ "B": 30,
+ "C": 31,
+ "D": 32,
+ "E": 33,
+ "F": 34,
+ "G": 35,
+ "H": 36,
+ "I": 37,
+ "K": 38,
+ "L": 39,
+ "M": 40,
+ "N": 41,
+ "O": 42,
+ "P": 43,
+ "Q": 44,
+ "R": 45,
+ "S": 46,
+ "T": 47,
+ "U": 48,
+ "V": 49,
+ "W": 50,
+ "X": 51,
+ "Y": 52,
+ "Z": 53,
+ "[": 54,
+ "]": 55,
+ "_": 56,
+ "a": 57,
+ "b": 58,
+ "c": 59,
+ "d": 60,
+ "e": 61,
+ "f": 62,
+ "g": 63,
+ "h": 64,
+ "i": 65,
+ "j": 66,
+ "k": 67,
+ "l": 68,
+ "m": 69,
+ "n": 70,
+ "o": 71,
+ "p": 72,
+ "q": 73,
+ "r": 74,
+ "s": 75,
+ "t": 76,
+ "u": 77,
+ "v": 78,
+ "w": 79,
+ "x": 80,
+ "y": 81,
+ "z": 82,
+ "~": 83,
+ "\u00b1": 84,
+ "\u00bc": 85,
+ "\u00c0": 86,
+ "\u00c5": 87,
+ "\u00d7": 88,
+ "\u00e9": 89,
+ "\u0351": 90,
+ "\u0352": 91,
+ "\u03b1": 92,
+ "\u03b2": 93,
+ "\u03b3": 94,
+ "\u03b4": 95,
+ "\u03ba": 96,
+ "\u03ea": 97,
+ "\u03ed": 98,
+ "\u0440": 99,
+ "\u060a": 100,
+ "\u2022": 101,
+ "\u2032": 102,
+ "\u2190": 103,
+ "\u2192": 104,
+ "\u2194": 105,
+ "\u2206": 106,
+ "\u2212": 107,
+ "\u223c": 108,
+ "\u2243": 109,
+ "\u2248": 110,
+ "\u2264": 111,
+ "\u2265": 112,
+ "\u22c5": 113,
+ "\u2426": 114,
+ "\uf02d": 115,
+ "\uf03e": 116,
+ "\uf064": 117,
+ "\uf06c": 118,
+ "\uf0a0": 119,
+ "\uf0b3": 120,
+ "\uf0bb": 121,
+ "\uff0e": 122
+ },
+ "vocab_tag": {
+ "": 0,
+ "B-": 1,
+ "B-": 2,
+ "B-": 3,
+ "B-": 4,
+ "B-": 5,
+ "B-": 6,
+ "B-": 7,
+ "B-": 8,
+ "I-": 9,
+ "I-": 10,
+ "I-": 11,
+ "I-": 12,
+ "I-": 13,
+ "I-": 14,
+ "I-": 15,
+ "I-": 16,
+ "O": 17
+ },
+ "vocab_case": [
+ "",
+ "numeric",
+ "allLower",
+ "allUpper",
+ "initialUpper",
+ "other",
+ "mainly_numeric",
+ "contains_digit"
+ ],
+ "max_char_length": 30,
+ "feature_preprocessor": null,
+ "indice_tag": {
+ "0": "",
+ "1": "B-",
+ "2": "B-",
+ "3": "B-",
+ "4": "B-",
+ "5": "B-",
+ "6": "B-",
+ "7": "B-",
+ "8": "B-",
+ "9": "I-",
+ "10": "I-",
+ "11": "I-",
+ "12": "I-",
+ "13": "I-",
+ "14": "I-",
+ "15": "I-",
+ "16": "I-",
+ "17": "O"
+ }
\ No newline at end of file
diff --git a/src/main/java/org/grobid/core/analyzers/DeepAnalyzer.java b/src/main/java/org/grobid/core/analyzers/DeepAnalyzer.java
index 34d1df25..c5ad7293 100644
--- a/src/main/java/org/grobid/core/analyzers/DeepAnalyzer.java
+++ b/src/main/java/org/grobid/core/analyzers/DeepAnalyzer.java
@@ -1,5 +1,6 @@
package org.grobid.core.analyzers;
+import org.apache.commons.lang3.NotImplementedException;
import org.apache.commons.lang3.StringUtils;
import org.grobid.core.lang.Language;
import org.grobid.core.layout.LayoutToken;
@@ -88,6 +89,21 @@ public List tokenizeWithLayoutToken(String text) {
return result;
+ @Override
+ public List retokenizeSubdigits(List list) {
+ throw new NotImplementedException("Not yet implemented");
+ }
+ @Override
+ public List retokenizeSubdigitsWithLayoutToken(List list) {
+ throw new NotImplementedException("Not yet implemented");
+ }
+ @Override
+ public List retokenizeSubdigitsFromLayoutToken(List list) {
+ throw new NotImplementedException("Not yet implemented");
+ }
public List retokenize(List chunks) {
List result = new ArrayList<>();
for (String chunk : chunks) {
diff --git a/src/main/java/org/grobid/core/data/document/DocumentBlock.java b/src/main/java/org/grobid/core/data/document/DocumentBlock.java
index 664c2229..8162c447 100644
--- a/src/main/java/org/grobid/core/data/document/DocumentBlock.java
+++ b/src/main/java/org/grobid/core/data/document/DocumentBlock.java
@@ -54,6 +54,11 @@ public DocumentBlock(List layoutTokens, String section, String subS
this.markers = new ArrayList<>(markers);
+ public DocumentBlock(List layoutTokens, String section, String subSection, String groupId, List spanList, List> markers) {
+ this(layoutTokens, section, subSection, spanList, markers);
+ this.groupId = groupId;
+ }
public String getSubSection() {
return subSection;
diff --git a/src/main/java/org/grobid/core/data/material/ChemicalComposition.java b/src/main/java/org/grobid/core/data/material/ChemicalComposition.java
index f64e71b9..878bc190 100644
--- a/src/main/java/org/grobid/core/data/material/ChemicalComposition.java
+++ b/src/main/java/org/grobid/core/data/material/ChemicalComposition.java
@@ -12,6 +12,10 @@ public class ChemicalComposition {
private String formula;
private String name;
+ private Integer code;
+ private String message;
public String getFormula() {
return formula;
@@ -38,7 +42,7 @@ public void setComposition(Map composition) {
public boolean isEmpty() {
- return StringUtils.isBlank(formula) && StringUtils.isBlank(name) && composition.keySet().size() == 0;
+ return StringUtils.isBlank(formula) && StringUtils.isBlank(name) && composition.keySet().isEmpty();
@@ -62,4 +66,20 @@ public boolean equals(Object o) {
public int hashCode() {
return Objects.hash(composition, formula, name);
+ public Integer getCode() {
+ return code;
+ }
+ public void setCode(Integer code) {
+ this.code = code;
+ }
+ public String getMessage() {
+ return message;
+ }
+ public void setMessage(String message) {
+ this.message = message;
+ }
diff --git a/src/main/java/org/grobid/core/data/material/Material.java b/src/main/java/org/grobid/core/data/material/Material.java
index 425fffc9..866ed565 100644
--- a/src/main/java/org/grobid/core/data/material/Material.java
+++ b/src/main/java/org/grobid/core/data/material/Material.java
@@ -182,7 +182,7 @@ public static List resolveVariables(Material material) {
// }
try {
- generatePermutations(mapOfContainedVariables, new ArrayList(containedVariables), outputFormulasString, Pair.of(0, 0), material.getFormula().getRawValue());
+ generatePermutations(mapOfContainedVariables, new ArrayList<>(containedVariables), outputFormulasString, Pair.of(0, 0), material.getFormula().getRawValue());
} catch (NumberFormatException e) {
Map> cleanedMapOfContainedVariables = new HashMap<>();
@@ -194,7 +194,7 @@ public static List resolveVariables(Material material) {
try {
- generatePermutations(cleanedMapOfContainedVariables, new ArrayList(containedVariables), outputFormulasString, Pair.of(0, 0), material.getFormula().getRawValue());
+ generatePermutations(cleanedMapOfContainedVariables, new ArrayList<>(containedVariables), outputFormulasString, Pair.of(0, 0), material.getFormula().getRawValue());
} catch (NumberFormatException e2) {
LOGGER.debug("Cannot replace variables " + Arrays.toString(variables.toArray()));
diff --git a/src/main/java/org/grobid/core/engines/GrobidPDFEngine.java b/src/main/java/org/grobid/core/engines/GrobidPDFEngine.java
index 2a7c1f99..dfabb7f6 100644
--- a/src/main/java/org/grobid/core/engines/GrobidPDFEngine.java
+++ b/src/main/java/org/grobid/core/engines/GrobidPDFEngine.java
@@ -2,6 +2,7 @@
import com.google.common.collect.Iterables;
import com.google.common.collect.Sets;
+import org.apache.commons.codec.digest.Md5Crypt;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.RandomStringUtils;
import org.apache.commons.lang3.StringUtils;
@@ -25,11 +26,13 @@
import org.grobid.core.tokenization.TaggingTokenCluster;
import org.grobid.core.tokenization.TaggingTokenClusteror;
import org.grobid.core.utilities.AdditionalLayoutTokensUtil;
+import org.grobid.core.utilities.LayoutTokensUtil;
import org.grobid.core.utilities.OffsetPosition;
import org.grobid.core.utilities.SentenceUtilities;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
+import java.nio.charset.StandardCharsets;
import java.util.*;
import java.util.function.Consumer;
import java.util.stream.Collectors;
@@ -299,7 +302,10 @@ public static BiblioInfo processDocument(Document doc, GrobidAnalysisConfig conf
List documentBlocksBySentences = new ArrayList<>();
documentBlocks.stream().forEach(documentBlock -> {
- String paragraphId = RandomStringUtils.random(10, true, true);
+// String paragraphMd5 = Md5Crypt.md5Crypt(LayoutTokensUtil.toText(documentBlock.getLayoutTokens()).getBytes(StandardCharsets.UTF_8)).substring(0, 10);
+ String paragraphId = RandomStringUtils.random(10, true, true);
List> markersExtremitiesAsIndex = new ArrayList<>();
List markersPositionsAsOffsetsInText = new ArrayList<>();
@@ -314,7 +320,7 @@ public static BiblioInfo processDocument(Document doc, GrobidAnalysisConfig conf
if (!sortedMarkersListByStartOffsets.equals(documentBlock.getMarkers())) {
diff --git a/src/main/java/org/grobid/core/engines/MaterialClassResolver.java b/src/main/java/org/grobid/core/engines/MaterialClassResolver.java
index 3a68a660..6900aefd 100644
--- a/src/main/java/org/grobid/core/engines/MaterialClassResolver.java
+++ b/src/main/java/org/grobid/core/engines/MaterialClassResolver.java
@@ -1,5 +1,6 @@
package org.grobid.core.engines;
+import com.google.inject.Inject;
import com.google.inject.Singleton;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.StringUtils;
@@ -9,7 +10,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;
diff --git a/src/main/java/org/grobid/core/engines/MaterialParser.java b/src/main/java/org/grobid/core/engines/MaterialParser.java
index 52ea4700..f50f96db 100644
--- a/src/main/java/org/grobid/core/engines/MaterialParser.java
+++ b/src/main/java/org/grobid/core/engines/MaterialParser.java
@@ -2,6 +2,7 @@
import com.google.common.collect.Iterables;
+import com.google.inject.Inject;
import org.apache.commons.lang3.StringUtils;
import org.apache.commons.lang3.tuple.Pair;
import org.apache.commons.text.StringEscapeUtils;
@@ -12,6 +13,7 @@
import org.grobid.core.data.material.Material;
import org.grobid.core.engines.label.TaggingLabel;
import org.grobid.core.exceptions.GrobidException;
+import org.grobid.core.exceptions.GrobidExceptionStatus;
import org.grobid.core.features.FeaturesVectorMaterial;
import org.grobid.core.layout.BoundingBox;
import org.grobid.core.layout.LayoutToken;
@@ -26,12 +28,10 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import java.util.ArrayList;
-import java.util.Arrays;
-import java.util.List;
+import java.util.*;
import java.util.regex.Pattern;
import java.util.stream.Collectors;
+import java.util.stream.IntStream;
import static org.apache.commons.collections4.CollectionUtils.isEmpty;
import static org.apache.commons.collections4.CollectionUtils.isNotEmpty;
@@ -87,6 +87,84 @@ public List process(String text) {
return process(SuperconductorsParser.textToLayoutTokens(text));
+ public List> processParallel(List texts) {
+ List emptyIndices = IntStream.range(0, texts.size())
+ .filter(i -> StringUtils.isBlank(texts.get(i)))
+ .boxed()
+ .toList();
+ Set emptyIndicesSet = new HashSet<>(emptyIndices);
+ List textsCopy = new ArrayList<>();
+ for (int is = 0; is < texts.size(); is++) {
+ if (!emptyIndices.contains(is)) {
+ textsCopy.add(texts.get(is));
+ }
+ }
+ List> asLayoutTokens = textsCopy.stream()
+ .map(SuperconductorsParser::textToLayoutTokens)
+ .collect(Collectors.toList());
+ List> processed = processParallelLT(asLayoutTokens);
+ emptyIndices.forEach(i -> processed.add(i, new ArrayList<>()));
+ List> output = new ArrayList<>();
+ for (int is = 0; is < texts.size(); is++) {
+ if (!emptyIndices.contains(is)) {
+ output.add(processed.get(is));
+ } else {
+ output.add(new ArrayList<>());
+ }
+ }
+ return output;
+ }
+ public List> processParallelLT(List> layoutTokensBatch) {
+ List> entities = new ArrayList<>();
+ //Normalisation
+ List> normalisedTokens = layoutTokensBatch.stream()
+ .map(SuperconductorsParser::normalizeAndRetokenizeLayoutTokens)
+ .toList();
+ try {
+ List tokensWithFeatures = normalisedTokens.stream().map(nt -> addFeatures(nt) + "\n").toList();
+ String labellingResult = null;
+ try {
+ labellingResult = label(tokensWithFeatures);
+ } catch (Exception e) {
+ throw new GrobidException("CRF labeling for superconductors parsing failed.", e);
+ }
+ List resultingBlocks = Arrays.asList(labellingResult.split("\n\n"));
+ List> localEntities = extractParallelResults(normalisedTokens, resultingBlocks);
+ entities.addAll(localEntities);
+ } catch (Exception e) {
+ throw new GrobidException("An exception occurred while running Grobid.", e);
+ }
+ return entities;
+ }
+ public List> extractParallelResults(List> tokens, List results) {
+ List> spans = new ArrayList<>();
+ if (tokens.size() != results.size()) {
+ throw new GrobidException("One of the text provided is invalid or empty and cannot be tagged. Please provide a clean input.", GrobidExceptionStatus.BAD_INPUT_DATA);
+ }
+ for (int i = 0; i < tokens.size(); i++) {
+ spans.add(extractResults(tokens.get(i), results.get(i)));
+ }
+ return spans;
+ }
public List process(List tokens) {
diff --git a/src/main/java/org/grobid/core/engines/ModuleEngine.java b/src/main/java/org/grobid/core/engines/ModuleEngine.java
index 298cda17..e98bdfda 100644
--- a/src/main/java/org/grobid/core/engines/ModuleEngine.java
+++ b/src/main/java/org/grobid/core/engines/ModuleEngine.java
@@ -1,6 +1,8 @@
package org.grobid.core.engines;
import com.google.common.collect.Iterables;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.commons.lang3.tuple.ImmutablePair;
@@ -22,8 +24,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.File;
import java.io.InputStream;
import java.util.*;
diff --git a/src/main/java/org/grobid/core/engines/RuleBasedLinker.java b/src/main/java/org/grobid/core/engines/RuleBasedLinker.java
index 9cd74695..93326e67 100644
--- a/src/main/java/org/grobid/core/engines/RuleBasedLinker.java
+++ b/src/main/java/org/grobid/core/engines/RuleBasedLinker.java
@@ -1,5 +1,6 @@
package org.grobid.core.engines;
+import com.google.inject.Inject;
import com.google.inject.Singleton;
import org.grobid.core.data.document.Link;
import org.grobid.core.data.document.Span;
@@ -9,7 +10,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
diff --git a/src/main/java/org/grobid/core/engines/SuperconductorsParser.java b/src/main/java/org/grobid/core/engines/SuperconductorsParser.java
index 2930d09e..c2c32cca 100644
--- a/src/main/java/org/grobid/core/engines/SuperconductorsParser.java
+++ b/src/main/java/org/grobid/core/engines/SuperconductorsParser.java
@@ -1,6 +1,8 @@
package org.grobid.core.engines;
import com.google.common.collect.Iterables;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.commons.lang3.tuple.Pair;
@@ -27,8 +29,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.util.*;
import java.util.stream.Collectors;
diff --git a/src/main/java/org/grobid/core/engines/linking/CRFBasedLinker.java b/src/main/java/org/grobid/core/engines/linking/CRFBasedLinker.java
index 7b98e683..1d10ba3e 100644
--- a/src/main/java/org/grobid/core/engines/linking/CRFBasedLinker.java
+++ b/src/main/java/org/grobid/core/engines/linking/CRFBasedLinker.java
@@ -1,6 +1,8 @@
package org.grobid.core.engines.linking;
import com.google.common.collect.Iterables;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.StringUtils;
import org.apache.commons.lang3.tuple.Pair;
@@ -23,8 +25,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.util.*;
import java.util.stream.Collectors;
diff --git a/src/main/java/org/grobid/core/engines/linking/EntityLinker_MaterialTcValue.java b/src/main/java/org/grobid/core/engines/linking/EntityLinker_MaterialTcValue.java
index ac19625a..138016a3 100644
--- a/src/main/java/org/grobid/core/engines/linking/EntityLinker_MaterialTcValue.java
+++ b/src/main/java/org/grobid/core/engines/linking/EntityLinker_MaterialTcValue.java
@@ -1,5 +1,7 @@
package org.grobid.core.engines.linking;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.grobid.core.GrobidModel;
import org.grobid.core.data.document.Span;
import org.grobid.core.engines.AbstractParser;
@@ -10,8 +12,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
diff --git a/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValueMe_Method.java b/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValueMe_Method.java
index f4758162..316ac2b1 100644
--- a/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValueMe_Method.java
+++ b/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValueMe_Method.java
@@ -1,5 +1,7 @@
package org.grobid.core.engines.linking;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.grobid.core.GrobidModel;
import org.grobid.core.data.document.Span;
import org.grobid.core.engines.AbstractParser;
@@ -10,8 +12,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
diff --git a/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValuePressure.java b/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValuePressure.java
index 1398df07..92779b1e 100644
--- a/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValuePressure.java
+++ b/src/main/java/org/grobid/core/engines/linking/EntityLinker_TcValuePressure.java
@@ -1,5 +1,7 @@
package org.grobid.core.engines.linking;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.grobid.core.GrobidModel;
import org.grobid.core.data.document.Span;
import org.grobid.core.engines.AbstractParser;
@@ -10,8 +12,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
diff --git a/src/main/java/org/grobid/core/engines/training/SuperconductorsParserTrainingData.java b/src/main/java/org/grobid/core/engines/training/SuperconductorsParserTrainingData.java
index 34f3831f..994be7d2 100644
--- a/src/main/java/org/grobid/core/engines/training/SuperconductorsParserTrainingData.java
+++ b/src/main/java/org/grobid/core/engines/training/SuperconductorsParserTrainingData.java
@@ -166,6 +166,7 @@ private void createTrainingPDF(File file, String outputDirectory, TrainingOutput
DocumentBlock newDocumentBlock = new DocumentBlock(documentBlock);
+ newDocumentBlock.setGroupId(documentBlock.getGroupId());
diff --git a/src/main/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatter.java b/src/main/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatter.java
index 6d06987d..4b113755 100644
--- a/src/main/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatter.java
+++ b/src/main/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatter.java
@@ -35,20 +35,31 @@ public String format(List documentBlocks, int id) {
Element body = teiElement("body");
+// Map> byParagraphs = documentBlocks.stream()
+// .collect(Collectors.groupingBy(DocumentBlock::getParagraphId));
+ String previousParagraphId = null;
+ String previousSection = "NO_SECTION";
+ Element previousParent = null;
+ Element parent = null;
for (DocumentBlock block : documentBlocks) {
+ String paragraphId = block.getGroupId();
if (block.getSection().equals(DocumentBlock.SECTION_BODY)) {
if (block.getSubSection().equals(DocumentBlock.SUB_SECTION_FIGURE)) {
- body.appendChild(trainingExtraction(block.getSpans(),
- block.getLayoutTokens(), "ab", Pair.of("type", "figureCaption")));
+ parent = getParentElement(body, previousParagraphId, paragraphId, previousParent, "ab", Pair.of("type", "figureCaption"));
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "s"));
} else if (block.getSubSection().equals(DocumentBlock.SUB_SECTION_TABLE)) {
- body.appendChild(trainingExtraction(block.getSpans(),
- block.getLayoutTokens(), "ab", Pair.of("type", "tableCaption")));
+ parent = getParentElement(body, previousParagraphId, paragraphId, previousParent, "ab", Pair.of("type", "tableCaption"));
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "s"));
} else if (block.getSubSection().equals(DocumentBlock.SUB_SECTION_PARAGRAPH)) {
- body.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens()));
+ parent = getParentElement(body, previousParagraphId, paragraphId, previousParent, "p", null);
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "s"));
} else if (block.getSubSection().equals(DocumentBlock.SUB_SECTION_TITLE_SECTION)) {
- body.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "head"));
+ parent = getParentElement(body, previousParagraphId, paragraphId, previousParent, "head", null);
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "s"));
} else {
- body.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens()));
+ parent = getParentElement(body, previousParagraphId, paragraphId, previousParent, "p", null);
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "s"));
} else if (block.getSection().equals(DocumentBlock.SECTION_HEADER)) {
if (block.getSubSection().equals(DocumentBlock.SUB_SECTION_TITLE)) {
@@ -65,25 +76,33 @@ public String format(List documentBlocks, int id) {
throw new RuntimeException("new keywords, but no space for them... ");
} else if (block.getSubSection().equals(DocumentBlock.SUB_SECTION_ABSTRACT)) {
Element abstractElement = SuperconductorsTeiUtils.getElement(profileDesc, "abstract");
if (abstractElement == null) {
abstractElement = teiElement("abstract");
- abstractElement.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens()));
+ parent = getParentElement(abstractElement, previousParagraphId, paragraphId, previousParent, "p", null);
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens(), "s"));
} else {
throw new RuntimeException("The section or subsection have the wrong name. " +
"This will cause loss of data in the output generated files. Section name: " + block.getSection() +
", " + block.getSubSection());
} else if (block.getSection().equals(DocumentBlock.SECTION_ANNEX)) {
- body.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens()));
+ if (!StringUtils.equals(paragraphId, previousParagraphId)) {
+ parent = teiElement("p");
+ body.appendChild(parent);
+ } else {
+ parent = previousParent;
+ }
+ parent.appendChild(trainingExtraction(block.getSpans(), block.getLayoutTokens()));
} else {
throw new RuntimeException("The section or subsection have the wrong name. " +
"This will cause loss of data in the output generated files. Section name: " + block.getSection() +
", " + block.getSubSection());
+ previousParent = parent;
+ previousParagraphId = paragraphId;
@@ -91,6 +110,26 @@ public String format(List documentBlocks, int id) {
return XmlBuilderUtils.toXml(outputDocumentRoot);
+ /**
+ * Create the parent element or, if under certain conditions, recycle the previous one.
+ */
+ protected Element getParentElement(Element body, String previousParagraphId, String paragraphId, Element previousParent, String parentTagName, Pair attributes) {
+ Element parent = null;
+ if (previousParent == null || !StringUtils.equals(paragraphId, previousParagraphId)) {
+ parent = teiElement(parentTagName);
+ if (attributes != null) {
+ parent.addAttribute(new Attribute(attributes.getLeft(), attributes.getRight()));
+ }
+ body.appendChild(parent);
+ } else {
+ parent = previousParent;
+ }
+ return parent;
+ }
protected Element trainingExtraction(List spanList, List tokens) {
return trainingExtraction(spanList, tokens, "p");
@@ -125,7 +164,7 @@ protected Element trainingExtraction(List spanList, List toke
// We stop the process if something doesn't match
- int accumulatedOffset = startPosition + length(contentBefore) + length(name);
+ int accumulatedOffset = startPosition + length(contentBefore) + LayoutTokensUtil.toText(superconductor.getLayoutTokens()).stripTrailing().length();
if (end != accumulatedOffset) {
throw new RuntimeException("Wrong synchronisation between entities and layout tokens. End entity offset: " + end
+ " different from the expected offset: " + accumulatedOffset);
diff --git a/src/main/java/org/grobid/core/utilities/client/ChemDataExtractorClient.java b/src/main/java/org/grobid/core/utilities/client/ChemDataExtractorClient.java
index 343aa4a4..76b9a0f5 100644
--- a/src/main/java/org/grobid/core/utilities/client/ChemDataExtractorClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/ChemDataExtractorClient.java
@@ -6,6 +6,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.HttpEntity;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
@@ -17,8 +19,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.ConnectException;
@@ -28,7 +28,7 @@
import java.util.List;
import java.util.stream.Collectors;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
import static org.grobid.core.utilities.client.LinkingModuleClient.toJson_listOfString;
diff --git a/src/main/java/org/grobid/core/utilities/client/ChemicalMaterialParserClient.java b/src/main/java/org/grobid/core/utilities/client/ChemicalMaterialParserClient.java
index 49e48857..cb711124 100644
--- a/src/main/java/org/grobid/core/utilities/client/ChemicalMaterialParserClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/ChemicalMaterialParserClient.java
@@ -6,6 +6,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.HttpEntity;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
@@ -18,8 +20,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
@@ -27,7 +27,7 @@
import java.nio.charset.StandardCharsets;
import java.util.List;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
public class ChemicalMaterialParserClient {
@@ -66,10 +66,16 @@ public ChemicalComposition convertNameToFormula(String name) {
try (CloseableHttpResponse response = httpClient.execute(request)) {
int statusCode = response.getStatusLine().getStatusCode();
- if (statusCode == HttpURLConnection.HTTP_OK) {
- outputFormula = fromJsonToChemicalComposition(response.getEntity().getContent());
+ if (statusCode != HttpURLConnection.HTTP_OK) {
+ LOGGER.debug("Not OK answer. Input: " + name + ". Status code: " + response.getStatusLine().getStatusCode());
} else {
- LOGGER.debug("Not OK answer. Input: " + name + ", status code: " + statusCode);
+ outputFormula = fromJsonToChemicalComposition(response.getEntity().getContent());
+ if (outputFormula != null && outputFormula.getCode() != HttpURLConnection.HTTP_OK) {
+ LOGGER.debug("Not OK answer. Input: " + name + ". " +
+ "Status code: " + outputFormula.getCode() +
+ "Message: " + outputFormula.getMessage());
+ outputFormula = new ChemicalComposition();
+ }
@@ -101,6 +107,11 @@ public ChemicalComposition convertFormulaToComposition(String formula) {
LOGGER.debug("Not OK answer. Input: " + formula + ". Status code: " + response.getStatusLine().getStatusCode());
} else {
outputComposition = fromJsonToChemicalComposition(response.getEntity().getContent());
+ if (outputComposition != null && outputComposition.getCode() != HttpURLConnection.HTTP_OK) {
+ LOGGER.debug("Not OK answer. Input: " + formula + ". Status code: " + outputComposition.getCode() +
+ "Message: " + outputComposition.getMessage());
+ outputComposition = new ChemicalComposition();
+ }
diff --git a/src/main/java/org/grobid/core/utilities/client/ChemspotClient.java b/src/main/java/org/grobid/core/utilities/client/ChemspotClient.java
index 0a375d3e..58599865 100644
--- a/src/main/java/org/grobid/core/utilities/client/ChemspotClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/ChemspotClient.java
@@ -6,6 +6,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.HttpEntity;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
@@ -17,8 +19,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
@@ -26,7 +26,8 @@
import java.util.ArrayList;
import java.util.List;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
public class ChemspotClient {
diff --git a/src/main/java/org/grobid/core/utilities/client/ClassResolverModuleClient.java b/src/main/java/org/grobid/core/utilities/client/ClassResolverModuleClient.java
index ef58bff6..0fcc12df 100644
--- a/src/main/java/org/grobid/core/utilities/client/ClassResolverModuleClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/ClassResolverModuleClient.java
@@ -6,6 +6,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.HttpEntity;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
@@ -17,8 +19,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
@@ -27,7 +27,7 @@
import java.util.ArrayList;
import java.util.List;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
public class ClassResolverModuleClient {
diff --git a/src/main/java/org/grobid/core/utilities/client/GrobidQuantitiesClient.java b/src/main/java/org/grobid/core/utilities/client/GrobidQuantitiesClient.java
index d1ca01a4..6f1e1b85 100644
--- a/src/main/java/org/grobid/core/utilities/client/GrobidQuantitiesClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/GrobidQuantitiesClient.java
@@ -5,6 +5,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.Consts;
import org.apache.http.NameValuePair;
import org.apache.http.client.entity.UrlEncodedFormEntity;
@@ -17,8 +19,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
@@ -27,8 +27,9 @@
import java.util.LinkedHashMap;
import java.util.List;
-import static javax.ws.rs.core.MediaType.APPLICATION_FORM_URLENCODED;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_FORM_URLENCODED;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
public class GrobidQuantitiesClient {
diff --git a/src/main/java/org/grobid/core/utilities/client/LinkingModuleClient.java b/src/main/java/org/grobid/core/utilities/client/LinkingModuleClient.java
index 2dd1ee39..b69d6b39 100644
--- a/src/main/java/org/grobid/core/utilities/client/LinkingModuleClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/LinkingModuleClient.java
@@ -6,6 +6,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.HttpEntity;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
@@ -18,8 +20,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
@@ -27,7 +27,8 @@
import java.nio.charset.StandardCharsets;
import java.util.List;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
public class LinkingModuleClient {
diff --git a/src/main/java/org/grobid/core/utilities/client/StructureIdentificationModuleClient.java b/src/main/java/org/grobid/core/utilities/client/StructureIdentificationModuleClient.java
index 3a6a62ce..3b4ca914 100644
--- a/src/main/java/org/grobid/core/utilities/client/StructureIdentificationModuleClient.java
+++ b/src/main/java/org/grobid/core/utilities/client/StructureIdentificationModuleClient.java
@@ -6,6 +6,8 @@
import com.fasterxml.jackson.databind.DeserializationFeature;
import com.fasterxml.jackson.databind.JsonMappingException;
import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.http.HttpEntity;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
@@ -18,8 +20,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.io.IOException;
import java.io.InputStream;
import java.net.HttpURLConnection;
@@ -28,7 +28,7 @@
import java.util.ArrayList;
import java.util.List;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
public class StructureIdentificationModuleClient {
diff --git a/src/main/java/org/grobid/service/EmptyOptionalNoContentExceptionMapper.java b/src/main/java/org/grobid/service/EmptyOptionalNoContentExceptionMapper.java
index d81ef81a..7fafdfce 100644
--- a/src/main/java/org/grobid/service/EmptyOptionalNoContentExceptionMapper.java
+++ b/src/main/java/org/grobid/service/EmptyOptionalNoContentExceptionMapper.java
@@ -2,9 +2,9 @@
import io.dropwizard.jersey.optional.EmptyOptionalException;
import io.dropwizard.jersey.optional.EmptyOptionalExceptionMapper;
+import jakarta.ws.rs.core.Response;
+import jakarta.ws.rs.ext.ExceptionMapper;
-import javax.ws.rs.core.Response;
-import javax.ws.rs.ext.ExceptionMapper;
* Returns a 204 for Optional.empty()
diff --git a/src/main/java/org/grobid/service/GrobidEngineInitialiser.java b/src/main/java/org/grobid/service/GrobidEngineInitialiser.java
index db08eb96..f7c4018d 100644
--- a/src/main/java/org/grobid/service/GrobidEngineInitialiser.java
+++ b/src/main/java/org/grobid/service/GrobidEngineInitialiser.java
@@ -1,6 +1,8 @@
package org.grobid.service;
import com.google.common.collect.ImmutableList;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.commons.lang3.StringUtils;
import org.grobid.core.main.GrobidHomeFinder;
import org.grobid.core.main.LibraryLoader;
@@ -10,8 +12,6 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
import java.lang.reflect.Field;
diff --git a/src/main/java/org/grobid/service/GrobidSuperconductorsApplication.java b/src/main/java/org/grobid/service/GrobidSuperconductorsApplication.java
index 7c9c6ac3..9e3528d1 100755
--- a/src/main/java/org/grobid/service/GrobidSuperconductorsApplication.java
+++ b/src/main/java/org/grobid/service/GrobidSuperconductorsApplication.java
@@ -1,25 +1,22 @@
package org.grobid.service;
-import com.google.inject.Module;
-import com.hubspot.dropwizard.guicier.GuiceBundle;
-import io.dropwizard.Application;
+import com.google.inject.AbstractModule;
import io.dropwizard.assets.AssetsBundle;
import io.dropwizard.configuration.EnvironmentVariableSubstitutor;
import io.dropwizard.configuration.SubstitutingSourceProvider;
+import io.dropwizard.core.Application;
+import io.dropwizard.core.setup.Bootstrap;
+import io.dropwizard.core.setup.Environment;
import io.dropwizard.forms.MultiPartBundle;
-import io.dropwizard.setup.Bootstrap;
-import io.dropwizard.setup.Environment;
+import jakarta.servlet.DispatcherType;
+import jakarta.servlet.FilterRegistration;
import org.eclipse.jetty.servlets.CrossOriginFilter;
-import org.eclipse.jetty.servlets.DoSFilter;
import org.eclipse.jetty.servlets.QoSFilter;
import org.grobid.service.command.*;
import org.grobid.service.configuration.GrobidSuperconductorsConfiguration;
+import ru.vyarus.dropwizard.guice.GuiceBundle;
-import javax.servlet.DispatcherType;
-import javax.servlet.FilterRegistration;
-import java.util.Arrays;
import java.util.EnumSet;
-import java.util.List;
public class GrobidSuperconductorsApplication extends Application {
private static final String RESOURCES = "/service";
@@ -33,8 +30,8 @@ public String getName() {
return "grobid-superconductors";
- private List extends Module> getGuiceModules() {
- return Arrays.asList(new SuperconductorsServiceModule());
+ private AbstractModule getGuiceModules() {
+ return new SuperconductorsServiceModule();
@@ -42,9 +39,10 @@ public void initialize(Bootstrap bootstrap)
bootstrap.setConfigurationSourceProvider(new SubstitutingSourceProvider(
bootstrap.getConfigurationSourceProvider(), new EnvironmentVariableSubstitutor(false)));
- GuiceBundle guiceBundle = GuiceBundle.defaultBuilder(GrobidSuperconductorsConfiguration.class)
+ GuiceBundle guiceBundle = GuiceBundle.builder()
bootstrap.addBundle(new MultiPartBundle());
bootstrap.addBundle(new AssetsBundle("/web", "/", "index.html", "assets"));
diff --git a/src/main/java/org/grobid/service/SuperconductorsServiceModule.java b/src/main/java/org/grobid/service/SuperconductorsServiceModule.java
index b9bdc522..b16280c0 100644
--- a/src/main/java/org/grobid/service/SuperconductorsServiceModule.java
+++ b/src/main/java/org/grobid/service/SuperconductorsServiceModule.java
@@ -1,10 +1,8 @@
package org.grobid.service;
-import com.codahale.metrics.MetricRegistry;
-import com.fasterxml.jackson.databind.ObjectMapper;
-import com.google.inject.Binder;
import com.google.inject.Provides;
-import com.hubspot.dropwizard.guicier.DropwizardAwareModule;
+import jakarta.ws.rs.client.Client;
+import jakarta.ws.rs.client.ClientBuilder;
import org.grobid.core.engines.*;
import org.grobid.core.engines.linking.CRFBasedLinker;
import org.grobid.core.utilities.client.*;
@@ -14,59 +12,42 @@
import org.grobid.service.exceptions.mapper.GrobidExceptionsTranslationUtility;
import org.grobid.service.exceptions.mapper.GrobidServiceExceptionMapper;
import org.grobid.service.exceptions.mapper.WebApplicationExceptionMapper;
-import javax.ws.rs.client.Client;
-import javax.ws.rs.client.ClientBuilder;
+import ru.vyarus.dropwizard.guice.module.support.DropwizardAwareModule;
public class SuperconductorsServiceModule extends DropwizardAwareModule {
- public void configure(Binder binder) {
+ public void configure() {
// Generic modules
- binder.bind(GrobidEngineInitialiser.class);
- binder.bind(HealthCheck.class);
+ bind(GrobidEngineInitialiser.class);
+ bind(HealthCheck.class);
//Core services
- binder.bind(ChemspotClient.class);
- binder.bind(ChemDataExtractorClient.class);
- binder.bind(StructureIdentificationModuleClient.class);
- binder.bind(ClassResolverModuleClient.class);
- binder.bind(MaterialClassResolver.class);
- binder.bind(ChemicalMaterialParserClient.class);
- binder.bind(MaterialParser.class);
- binder.bind(LinkingModuleClient.class);
- binder.bind(RuleBasedLinker.class);
- binder.bind(CRFBasedLinker.class);
- binder.bind(SuperconductorsParser.class);
- binder.bind(ModuleEngine.class);
+ bind(ChemspotClient.class);
+ bind(ChemDataExtractorClient.class);
+ bind(StructureIdentificationModuleClient.class);
+ bind(ClassResolverModuleClient.class);
+ bind(MaterialClassResolver.class);
+ bind(ChemicalMaterialParserClient.class);
+ bind(MaterialParser.class);
+ bind(LinkingModuleClient.class);
+ bind(RuleBasedLinker.class);
+ bind(CRFBasedLinker.class);
+ bind(SuperconductorsParser.class);
+ bind(ModuleEngine.class);
- binder.bind(AnnotationController.class);
- binder.bind(MaterialController.class);
- binder.bind(LinkerController.class);
- binder.bind(ServiceController.class);
+ bind(AnnotationController.class);
+ bind(MaterialController.class);
+ bind(LinkerController.class);
+ bind(ServiceController.class);
//Exception Mappers
- binder.bind(GrobidServiceExceptionMapper.class);
- binder.bind(GrobidExceptionsTranslationUtility.class);
- binder.bind(GrobidExceptionMapper.class);
- binder.bind(WebApplicationExceptionMapper.class);
- }
- @Provides
- protected ObjectMapper getObjectMapper() {
- return getEnvironment().getObjectMapper();
- }
- @Provides
- protected MetricRegistry provideMetricRegistry() {
- return getMetricRegistry();
- }
- //for unit tests
- protected MetricRegistry getMetricRegistry() {
- return getEnvironment().metrics();
+ bind(GrobidServiceExceptionMapper.class);
+ bind(GrobidExceptionsTranslationUtility.class);
+ bind(GrobidExceptionMapper.class);
+ bind(WebApplicationExceptionMapper.class);
diff --git a/src/main/java/org/grobid/service/command/InterAnnotationAgreementCommand.java b/src/main/java/org/grobid/service/command/InterAnnotationAgreementCommand.java
index 2351e268..19db78d8 100644
--- a/src/main/java/org/grobid/service/command/InterAnnotationAgreementCommand.java
+++ b/src/main/java/org/grobid/service/command/InterAnnotationAgreementCommand.java
@@ -1,7 +1,7 @@
package org.grobid.service.command;
-import io.dropwizard.cli.ConfiguredCommand;
-import io.dropwizard.setup.Bootstrap;
+import io.dropwizard.core.cli.ConfiguredCommand;
+import io.dropwizard.core.setup.Bootstrap;
import net.sourceforge.argparse4j.impl.Arguments;
import net.sourceforge.argparse4j.inf.Namespace;
import net.sourceforge.argparse4j.inf.Subparser;
diff --git a/src/main/java/org/grobid/service/command/PrepareDelftTrainingCommand.java b/src/main/java/org/grobid/service/command/PrepareDelftTrainingCommand.java
index 3af119ea..df0828a1 100644
--- a/src/main/java/org/grobid/service/command/PrepareDelftTrainingCommand.java
+++ b/src/main/java/org/grobid/service/command/PrepareDelftTrainingCommand.java
@@ -1,7 +1,7 @@
package org.grobid.service.command;
-import io.dropwizard.cli.ConfiguredCommand;
-import io.dropwizard.setup.Bootstrap;
+import io.dropwizard.core.cli.ConfiguredCommand;
+import io.dropwizard.core.setup.Bootstrap;
import net.sourceforge.argparse4j.impl.Arguments;
import net.sourceforge.argparse4j.inf.MutuallyExclusiveGroup;
import net.sourceforge.argparse4j.inf.Namespace;
diff --git a/src/main/java/org/grobid/service/command/PrepareMaterialParserTrainingCommand.java b/src/main/java/org/grobid/service/command/PrepareMaterialParserTrainingCommand.java
index 1ab48bfa..b7944cfa 100644
--- a/src/main/java/org/grobid/service/command/PrepareMaterialParserTrainingCommand.java
+++ b/src/main/java/org/grobid/service/command/PrepareMaterialParserTrainingCommand.java
@@ -1,7 +1,7 @@
package org.grobid.service.command;
-import io.dropwizard.cli.ConfiguredCommand;
-import io.dropwizard.setup.Bootstrap;
+import io.dropwizard.core.cli.ConfiguredCommand;
+import io.dropwizard.core.setup.Bootstrap;
import net.sourceforge.argparse4j.impl.Arguments;
import net.sourceforge.argparse4j.inf.Namespace;
import net.sourceforge.argparse4j.inf.Subparser;
diff --git a/src/main/java/org/grobid/service/command/RunTrainingCommand.java b/src/main/java/org/grobid/service/command/RunTrainingCommand.java
index fedc4cdb..4998b75d 100644
--- a/src/main/java/org/grobid/service/command/RunTrainingCommand.java
+++ b/src/main/java/org/grobid/service/command/RunTrainingCommand.java
@@ -1,7 +1,7 @@
package org.grobid.service.command;
-import io.dropwizard.cli.ConfiguredCommand;
-import io.dropwizard.setup.Bootstrap;
+import io.dropwizard.core.cli.ConfiguredCommand;
+import io.dropwizard.core.setup.Bootstrap;
import net.sourceforge.argparse4j.inf.Namespace;
import net.sourceforge.argparse4j.inf.Subparser;
import org.grobid.core.engines.SuperconductorsModels;
diff --git a/src/main/java/org/grobid/service/command/TrainingGenerationCommand.java b/src/main/java/org/grobid/service/command/TrainingGenerationCommand.java
index 67e681fd..359707d1 100644
--- a/src/main/java/org/grobid/service/command/TrainingGenerationCommand.java
+++ b/src/main/java/org/grobid/service/command/TrainingGenerationCommand.java
@@ -1,7 +1,7 @@
package org.grobid.service.command;
-import io.dropwizard.cli.ConfiguredCommand;
-import io.dropwizard.setup.Bootstrap;
+import io.dropwizard.core.cli.ConfiguredCommand;
+import io.dropwizard.core.setup.Bootstrap;
import net.sourceforge.argparse4j.impl.Arguments;
import net.sourceforge.argparse4j.inf.Namespace;
import net.sourceforge.argparse4j.inf.Subparser;
diff --git a/src/main/java/org/grobid/service/configuration/GrobidSuperconductorsConfiguration.java b/src/main/java/org/grobid/service/configuration/GrobidSuperconductorsConfiguration.java
index 12c20dd0..4f5bf679 100755
--- a/src/main/java/org/grobid/service/configuration/GrobidSuperconductorsConfiguration.java
+++ b/src/main/java/org/grobid/service/configuration/GrobidSuperconductorsConfiguration.java
@@ -1,12 +1,12 @@
package org.grobid.service.configuration;
import com.fasterxml.jackson.annotation.JsonProperty;
-import io.dropwizard.Configuration;
+import io.dropwizard.core.Configuration;
import org.apache.commons.io.IOUtils;
-import org.grobid.core.utilities.GrobidConfig;
-import org.grobid.core.utilities.GrobidProperties;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
+import org.grobid.core.utilities.GrobidConfig;
+import org.grobid.core.utilities.GrobidProperties;
import java.io.IOException;
import java.io.InputStream;
diff --git a/src/main/java/org/grobid/service/controller/AnnotationController.java b/src/main/java/org/grobid/service/controller/AnnotationController.java
index 81966d42..750175b7 100644
--- a/src/main/java/org/grobid/service/controller/AnnotationController.java
+++ b/src/main/java/org/grobid/service/controller/AnnotationController.java
@@ -1,5 +1,7 @@
package org.grobid.service.controller;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.StringUtils;
import org.glassfish.jersey.media.multipart.FormDataContentDisposition;
@@ -12,10 +14,8 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
-import javax.ws.rs.*;
-import javax.ws.rs.core.MediaType;
+import jakarta.ws.rs.*;
+import jakarta.ws.rs.core.MediaType;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.List;
diff --git a/src/main/java/org/grobid/service/controller/HealthCheck.java b/src/main/java/org/grobid/service/controller/HealthCheck.java
index 83851406..202b6612 100644
--- a/src/main/java/org/grobid/service/controller/HealthCheck.java
+++ b/src/main/java/org/grobid/service/controller/HealthCheck.java
@@ -1,15 +1,16 @@
package org.grobid.service.controller;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.grobid.service.configuration.GrobidSuperconductorsConfiguration;
-import javax.inject.Inject;
-import javax.inject.Singleton;
-import javax.ws.rs.GET;
-import javax.ws.rs.Path;
-import javax.ws.rs.Produces;
-import javax.ws.rs.core.Response;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON;
+import jakarta.ws.rs.GET;
+import jakarta.ws.rs.Path;
+import jakarta.ws.rs.Produces;
+import jakarta.ws.rs.core.Response;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON;
diff --git a/src/main/java/org/grobid/service/controller/LinkerController.java b/src/main/java/org/grobid/service/controller/LinkerController.java
index 218ea02f..c982a1e2 100644
--- a/src/main/java/org/grobid/service/controller/LinkerController.java
+++ b/src/main/java/org/grobid/service/controller/LinkerController.java
@@ -1,6 +1,8 @@
package org.grobid.service.controller;
import com.ctc.wstx.stax.WstxInputFactory;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.apache.commons.lang3.tuple.Pair;
import org.codehaus.stax2.XMLStreamReader2;
import org.glassfish.jersey.media.multipart.FormDataParam;
@@ -14,14 +16,12 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.inject.Inject;
-import javax.inject.Singleton;
-import javax.ws.rs.GET;
-import javax.ws.rs.POST;
-import javax.ws.rs.Path;
-import javax.ws.rs.Produces;
-import javax.ws.rs.core.MediaType;
-import javax.ws.rs.core.Response;
+import jakarta.ws.rs.GET;
+import jakarta.ws.rs.POST;
+import jakarta.ws.rs.Path;
+import jakarta.ws.rs.Produces;
+import jakarta.ws.rs.core.MediaType;
+import jakarta.ws.rs.core.Response;
import javax.xml.stream.XMLStreamException;
import java.io.ByteArrayInputStream;
import java.io.InputStream;
diff --git a/src/main/java/org/grobid/service/controller/MaterialController.java b/src/main/java/org/grobid/service/controller/MaterialController.java
index c9155478..dfbdf309 100644
--- a/src/main/java/org/grobid/service/controller/MaterialController.java
+++ b/src/main/java/org/grobid/service/controller/MaterialController.java
@@ -1,17 +1,18 @@
package org.grobid.service.controller;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
+import jakarta.ws.rs.GET;
+import jakarta.ws.rs.POST;
+import jakarta.ws.rs.Path;
+import jakarta.ws.rs.Produces;
+import jakarta.ws.rs.core.MediaType;
import org.glassfish.jersey.media.multipart.FormDataParam;
import org.grobid.core.data.material.Material;
import org.grobid.core.engines.MaterialParser;
import org.grobid.service.configuration.GrobidSuperconductorsConfiguration;
-import javax.inject.Inject;
-import javax.inject.Singleton;
-import javax.ws.rs.GET;
-import javax.ws.rs.POST;
-import javax.ws.rs.Path;
-import javax.ws.rs.Produces;
-import javax.ws.rs.core.MediaType;
+import java.util.Arrays;
import java.util.List;
@@ -42,10 +43,32 @@ public List processTextSuperconductorsGet(@FormDataParam("text") Strin
return parseMaterial(text);
+ @Path("multiparse")
+ @Produces(MediaType.APPLICATION_JSON)
+ public List> processTextSuperconductorsPost2(@FormDataParam("texts") String texts) {
+ return parseMaterials(texts);
+ }
+ @Path("multiparse")
+ @Produces(MediaType.APPLICATION_JSON)
+ @GET
+ public List> processTextSuperconductorsGet2(@FormDataParam("texts") String texts) {
+ return parseMaterials(texts);
+ }
private List parseMaterial(@FormDataParam("text") String text) {
String textPreprocessed = text.replace("\r\n", "\n");
return materialParser.process(textPreprocessed);
+ private List> parseMaterials(@FormDataParam("text") String text) {
+ String textPreprocessed = text.replace("\r\n", "\n");
+ List list = Arrays.asList(textPreprocessed.split("\n"));
+ return materialParser.processParallel(list);
+ }
diff --git a/src/main/java/org/grobid/service/controller/ServiceController.java b/src/main/java/org/grobid/service/controller/ServiceController.java
index 17fbfee9..92a0584e 100644
--- a/src/main/java/org/grobid/service/controller/ServiceController.java
+++ b/src/main/java/org/grobid/service/controller/ServiceController.java
@@ -1,14 +1,14 @@
package org.grobid.service.controller;
+import com.google.inject.Inject;
+import com.google.inject.Singleton;
import org.grobid.core.data.ServiceInfo;
import org.grobid.service.configuration.GrobidSuperconductorsConfiguration;
-import javax.inject.Inject;
-import javax.inject.Singleton;
-import javax.ws.rs.GET;
-import javax.ws.rs.Path;
-import javax.ws.rs.Produces;
-import javax.ws.rs.core.MediaType;
+import jakarta.ws.rs.GET;
+import jakarta.ws.rs.Path;
+import jakarta.ws.rs.Produces;
+import jakarta.ws.rs.core.MediaType;
diff --git a/src/main/java/org/grobid/service/exceptions/GrobidServiceException.java b/src/main/java/org/grobid/service/exceptions/GrobidServiceException.java
index 86594f0d..8ff8d501 100755
--- a/src/main/java/org/grobid/service/exceptions/GrobidServiceException.java
+++ b/src/main/java/org/grobid/service/exceptions/GrobidServiceException.java
@@ -2,7 +2,7 @@
import org.grobid.core.exceptions.GrobidException;
-import javax.ws.rs.core.Response;
+import jakarta.ws.rs.core.Response;
public class GrobidServiceException extends GrobidException {
diff --git a/src/main/java/org/grobid/service/exceptions/GrobidServicePropertyException.java b/src/main/java/org/grobid/service/exceptions/GrobidServicePropertyException.java
index 67d20b96..d0b3965a 100755
--- a/src/main/java/org/grobid/service/exceptions/GrobidServicePropertyException.java
+++ b/src/main/java/org/grobid/service/exceptions/GrobidServicePropertyException.java
@@ -1,6 +1,6 @@
package org.grobid.service.exceptions;
-import javax.ws.rs.core.Response;
+import jakarta.ws.rs.core.Response;
public class GrobidServicePropertyException extends GrobidServiceException {
diff --git a/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionMapper.java b/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionMapper.java
index 0a0eff9e..30820b2d 100644
--- a/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionMapper.java
+++ b/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionMapper.java
@@ -5,12 +5,12 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.ws.rs.core.Context;
-import javax.ws.rs.core.HttpHeaders;
-import javax.ws.rs.core.Response;
-import javax.ws.rs.core.UriInfo;
-import javax.ws.rs.ext.ExceptionMapper;
-import javax.ws.rs.ext.Provider;
+import jakarta.ws.rs.core.Context;
+import jakarta.ws.rs.core.HttpHeaders;
+import jakarta.ws.rs.core.Response;
+import jakarta.ws.rs.core.UriInfo;
+import jakarta.ws.rs.ext.ExceptionMapper;
+import jakarta.ws.rs.ext.Provider;
public class GrobidExceptionMapper implements ExceptionMapper {
diff --git a/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionsTranslationUtility.java b/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionsTranslationUtility.java
index 64f103e0..92929b38 100644
--- a/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionsTranslationUtility.java
+++ b/src/main/java/org/grobid/service/exceptions/mapper/GrobidExceptionsTranslationUtility.java
@@ -4,13 +4,13 @@
import com.fasterxml.jackson.databind.node.ObjectNode;
import com.google.common.base.Joiner;
import com.google.common.base.Throwables;
+import com.google.inject.Inject;
import org.grobid.core.exceptions.GrobidExceptionStatus;
import org.slf4j.MDC;
-import javax.inject.Inject;
-import javax.ws.rs.core.MediaType;
-import javax.ws.rs.core.Response;
-import javax.ws.rs.ext.Provider;
+import jakarta.ws.rs.core.MediaType;
+import jakarta.ws.rs.core.Response;
+import jakarta.ws.rs.ext.Provider;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
diff --git a/src/main/java/org/grobid/service/exceptions/mapper/GrobidServiceExceptionMapper.java b/src/main/java/org/grobid/service/exceptions/mapper/GrobidServiceExceptionMapper.java
index ebe26ffb..7e92c1fe 100644
--- a/src/main/java/org/grobid/service/exceptions/mapper/GrobidServiceExceptionMapper.java
+++ b/src/main/java/org/grobid/service/exceptions/mapper/GrobidServiceExceptionMapper.java
@@ -5,12 +5,12 @@
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
-import javax.ws.rs.core.Context;
-import javax.ws.rs.core.HttpHeaders;
-import javax.ws.rs.core.Response;
-import javax.ws.rs.core.UriInfo;
-import javax.ws.rs.ext.ExceptionMapper;
-import javax.ws.rs.ext.Provider;
+import jakarta.ws.rs.core.Context;
+import jakarta.ws.rs.core.HttpHeaders;
+import jakarta.ws.rs.core.Response;
+import jakarta.ws.rs.core.UriInfo;
+import jakarta.ws.rs.ext.ExceptionMapper;
+import jakarta.ws.rs.ext.Provider;
public class GrobidServiceExceptionMapper implements ExceptionMapper {
diff --git a/src/main/java/org/grobid/service/exceptions/mapper/GrobidStatusToHttpStatusMapper.java b/src/main/java/org/grobid/service/exceptions/mapper/GrobidStatusToHttpStatusMapper.java
index 9642d13a..54a0a869 100644
--- a/src/main/java/org/grobid/service/exceptions/mapper/GrobidStatusToHttpStatusMapper.java
+++ b/src/main/java/org/grobid/service/exceptions/mapper/GrobidStatusToHttpStatusMapper.java
@@ -2,7 +2,7 @@
import org.grobid.core.exceptions.GrobidExceptionStatus;
-import javax.ws.rs.core.Response;
+import jakarta.ws.rs.core.Response;
public class GrobidStatusToHttpStatusMapper {
public static Response.Status getStatusCode(GrobidExceptionStatus status) {
diff --git a/src/main/java/org/grobid/service/exceptions/mapper/WebApplicationExceptionMapper.java b/src/main/java/org/grobid/service/exceptions/mapper/WebApplicationExceptionMapper.java
index 7d72e026..7489b427 100644
--- a/src/main/java/org/grobid/service/exceptions/mapper/WebApplicationExceptionMapper.java
+++ b/src/main/java/org/grobid/service/exceptions/mapper/WebApplicationExceptionMapper.java
@@ -2,10 +2,10 @@
import com.google.inject.Inject;
-import javax.ws.rs.WebApplicationException;
-import javax.ws.rs.core.Response;
-import javax.ws.rs.ext.ExceptionMapper;
-import javax.ws.rs.ext.Provider;
+import jakarta.ws.rs.WebApplicationException;
+import jakarta.ws.rs.core.Response;
+import jakarta.ws.rs.ext.ExceptionMapper;
+import jakarta.ws.rs.ext.Provider;
public class WebApplicationExceptionMapper implements ExceptionMapper {
diff --git a/src/main/resources/web/index.html b/src/main/resources/web/index.html
index a57532c0..535bd76e 100644
--- a/src/main/resources/web/index.html
+++ b/src/main/resources/web/index.html
@@ -7,7 +7,7 @@
@@ -445,7 +445,7 @@
unknown version
+ © GROBID contributors, 2019 - 2024 | unknown version
diff --git a/src/main/resources/web/resources/libs/jquery/jquery-1.10.0.min.js b/src/main/resources/web/resources/libs/jquery/jquery-1.10.0.min.js
deleted file mode 100644
index 01c68816..00000000
--- a/src/main/resources/web/resources/libs/jquery/jquery-1.10.0.min.js
+++ /dev/null
@@ -1,6 +0,0 @@
diff --git a/src/main/resources/web/resources/libs/jquery/jquery-3.4.1.js b/src/main/resources/web/resources/libs/jquery/jquery-3.4.1.js
deleted file mode 100644
index 773ad95c..00000000
--- a/src/main/resources/web/resources/libs/jquery/jquery-3.4.1.js
+++ /dev/null
@@ -1,10598 +0,0 @@
- * jQuery JavaScript Library v3.4.1
- * https://jquery.com/
- *
- * Includes Sizzle.js
- * https://sizzlejs.com/
- *
- * Copyright JS Foundation and other contributors
- * Released under the MIT license
- * https://jquery.org/license
- *
- * Date: 2019-05-01T21:04Z
- */
-( function( global, factory ) {
- "use strict";
- if ( typeof module === "object" && typeof module.exports === "object" ) {
- // For CommonJS and CommonJS-like environments where a proper `window`
- // is present, execute the factory and get jQuery.
- // For environments that do not have a `window` with a `document`
- // (such as Node.js), expose a factory as module.exports.
- // This accentuates the need for the creation of a real `window`.
- // e.g. var jQuery = require("jquery")(window);
- // See ticket #14549 for more info.
- module.exports = global.document ?
- factory( global, true ) :
- function( w ) {
- if ( !w.document ) {
- throw new Error( "jQuery requires a window with a document" );
- }
- return factory( w );
- };
- } else {
- factory( global );
- }
-// Pass this if window is not defined yet
-} )( typeof window !== "undefined" ? window : this, function( window, noGlobal ) {
-// Edge <= 12 - 13+, Firefox <=18 - 45+, IE 10 - 11, Safari 5.1 - 9+, iOS 6 - 9.1
-// throw exceptions when non-strict code (e.g., ASP.NET 4.5) accesses strict mode
-// arguments.callee.caller (trac-13335). But as of jQuery 3.0 (2016), strict mode should be common
-// enough that all such attempts are guarded in a try block.
-"use strict";
-var arr = [];
-var document = window.document;
-var getProto = Object.getPrototypeOf;
-var slice = arr.slice;
-var concat = arr.concat;
-var push = arr.push;
-var indexOf = arr.indexOf;
-var class2type = {};
-var toString = class2type.toString;
-var hasOwn = class2type.hasOwnProperty;
-var fnToString = hasOwn.toString;
-var ObjectFunctionString = fnToString.call( Object );
-var support = {};
-var isFunction = function isFunction( obj ) {
- // Support: Chrome <=57, Firefox <=52
- // In some browsers, typeof returns "function" for HTML
- // (i.e., `typeof document.createElement( "object" ) === "function"`).
- // We don't want to classify *any* DOM node as a function.
- return typeof obj === "function" && typeof obj.nodeType !== "number";
- };
-var isWindow = function isWindow( obj ) {
- return obj != null && obj === obj.window;
- };
- var preservedScriptAttributes = {
- type: true,
- src: true,
- nonce: true,
- noModule: true
- };
- function DOMEval( code, node, doc ) {
- doc = doc || document;
- var i, val,
- script = doc.createElement( "script" );
- script.text = code;
- if ( node ) {
- for ( i in preservedScriptAttributes ) {
- // Support: Firefox 64+, Edge 18+
- // Some browsers don't support the "nonce" property on scripts.
- // On the other hand, just using `getAttribute` is not enough as
- // the `nonce` attribute is reset to an empty string whenever it
- // becomes browsing-context connected.
- // See https://github.com/whatwg/html/issues/2369
- // See https://html.spec.whatwg.org/#nonce-attributes
- // The `node.getAttribute` check was added for the sake of
- // `jQuery.globalEval` so that it can fake a nonce-containing node
- // via an object.
- val = node[ i ] || node.getAttribute && node.getAttribute( i );
- if ( val ) {
- script.setAttribute( i, val );
- }
- }
- }
- doc.head.appendChild( script ).parentNode.removeChild( script );
- }
-function toType( obj ) {
- if ( obj == null ) {
- return obj + "";
- }
- // Support: Android <=2.3 only (functionish RegExp)
- return typeof obj === "object" || typeof obj === "function" ?
- class2type[ toString.call( obj ) ] || "object" :
- typeof obj;
-/* global Symbol */
-// Defining this global in .eslintrc.json would create a danger of using the global
-// unguarded in another place, it seems safer to define global only for this module
- version = "3.4.1",
- // Define a local copy of jQuery
- jQuery = function( selector, context ) {
- // The jQuery object is actually just the init constructor 'enhanced'
- // Need init if jQuery is called (just allow error to be thrown if not included)
- return new jQuery.fn.init( selector, context );
- },
- // Support: Android <=4.0 only
- // Make sure we trim BOM and NBSP
- rtrim = /^[\s\uFEFF\xA0]+|[\s\uFEFF\xA0]+$/g;
-jQuery.fn = jQuery.prototype = {
- // The current version of jQuery being used
- jquery: version,
- constructor: jQuery,
- // The default length of a jQuery object is 0
- length: 0,
- toArray: function() {
- return slice.call( this );
- },
- // Get the Nth element in the matched element set OR
- // Get the whole matched element set as a clean array
- get: function( num ) {
- // Return all the elements in a clean array
- if ( num == null ) {
- return slice.call( this );
- }
- // Return just the one element from the set
- return num < 0 ? this[ num + this.length ] : this[ num ];
- },
- // Take an array of elements and push it onto the stack
- // (returning the new matched element set)
- pushStack: function( elems ) {
- // Build a new jQuery matched element set
- var ret = jQuery.merge( this.constructor(), elems );
- // Add the old object onto the stack (as a reference)
- ret.prevObject = this;
- // Return the newly-formed element set
- return ret;
- },
- // Execute a callback for every element in the matched set.
- each: function( callback ) {
- return jQuery.each( this, callback );
- },
- map: function( callback ) {
- return this.pushStack( jQuery.map( this, function( elem, i ) {
- return callback.call( elem, i, elem );
- } ) );
- },
- slice: function() {
- return this.pushStack( slice.apply( this, arguments ) );
- },
- first: function() {
- return this.eq( 0 );
- },
- last: function() {
- return this.eq( -1 );
- },
- eq: function( i ) {
- var len = this.length,
- j = +i + ( i < 0 ? len : 0 );
- return this.pushStack( j >= 0 && j < len ? [ this[ j ] ] : [] );
- },
- end: function() {
- return this.prevObject || this.constructor();
- },
- // For internal use only.
- // Behaves like an Array's method, not like a jQuery method.
- push: push,
- sort: arr.sort,
- splice: arr.splice
-jQuery.extend = jQuery.fn.extend = function() {
- var options, name, src, copy, copyIsArray, clone,
- target = arguments[ 0 ] || {},
- i = 1,
- length = arguments.length,
- deep = false;
- // Handle a deep copy situation
- if ( typeof target === "boolean" ) {
- deep = target;
- // Skip the boolean and the target
- target = arguments[ i ] || {};
- i++;
- }
- // Handle case when target is a string or something (possible in deep copy)
- if ( typeof target !== "object" && !isFunction( target ) ) {
- target = {};
- }
- // Extend jQuery itself if only one argument is passed
- if ( i === length ) {
- target = this;
- i--;
- }
- for ( ; i < length; i++ ) {
- // Only deal with non-null/undefined values
- if ( ( options = arguments[ i ] ) != null ) {
- // Extend the base object
- for ( name in options ) {
- copy = options[ name ];
- // Prevent Object.prototype pollution
- // Prevent never-ending loop
- if ( name === "__proto__" || target === copy ) {
- continue;
- }
- // Recurse if we're merging plain objects or arrays
- if ( deep && copy && ( jQuery.isPlainObject( copy ) ||
- ( copyIsArray = Array.isArray( copy ) ) ) ) {
- src = target[ name ];
- // Ensure proper type for the source value
- if ( copyIsArray && !Array.isArray( src ) ) {
- clone = [];
- } else if ( !copyIsArray && !jQuery.isPlainObject( src ) ) {
- clone = {};
- } else {
- clone = src;
- }
- copyIsArray = false;
- // Never move original objects, clone them
- target[ name ] = jQuery.extend( deep, clone, copy );
- // Don't bring in undefined values
- } else if ( copy !== undefined ) {
- target[ name ] = copy;
- }
- }
- }
- }
- // Return the modified object
- return target;
-jQuery.extend( {
- // Unique for each copy of jQuery on the page
- expando: "jQuery" + ( version + Math.random() ).replace( /\D/g, "" ),
- // Assume jQuery is ready without the ready module
- isReady: true,
- error: function( msg ) {
- throw new Error( msg );
- },
- noop: function() {},
- isPlainObject: function( obj ) {
- var proto, Ctor;
- // Detect obvious negatives
- // Use toString instead of jQuery.type to catch host objects
- if ( !obj || toString.call( obj ) !== "[object Object]" ) {
- return false;
- }
- proto = getProto( obj );
- // Objects with no prototype (e.g., `Object.create( null )`) are plain
- if ( !proto ) {
- return true;
- }
- // Objects with prototype are plain iff they were constructed by a global Object function
- Ctor = hasOwn.call( proto, "constructor" ) && proto.constructor;
- return typeof Ctor === "function" && fnToString.call( Ctor ) === ObjectFunctionString;
- },
- isEmptyObject: function( obj ) {
- var name;
- for ( name in obj ) {
- return false;
- }
- return true;
- },
- // Evaluates a script in a global context
- globalEval: function( code, options ) {
- DOMEval( code, { nonce: options && options.nonce } );
- },
- each: function( obj, callback ) {
- var length, i = 0;
- if ( isArrayLike( obj ) ) {
- length = obj.length;
- for ( ; i < length; i++ ) {
- if ( callback.call( obj[ i ], i, obj[ i ] ) === false ) {
- break;
- }
- }
- } else {
- for ( i in obj ) {
- if ( callback.call( obj[ i ], i, obj[ i ] ) === false ) {
- break;
- }
- }
- }
- return obj;
- },
- // Support: Android <=4.0 only
- trim: function( text ) {
- return text == null ?
- "" :
- ( text + "" ).replace( rtrim, "" );
- },
- // results is for internal usage only
- makeArray: function( arr, results ) {
- var ret = results || [];
- if ( arr != null ) {
- if ( isArrayLike( Object( arr ) ) ) {
- jQuery.merge( ret,
- typeof arr === "string" ?
- [ arr ] : arr
- );
- } else {
- push.call( ret, arr );
- }
- }
- return ret;
- },
- inArray: function( elem, arr, i ) {
- return arr == null ? -1 : indexOf.call( arr, elem, i );
- },
- // Support: Android <=4.0 only, PhantomJS 1 only
- // push.apply(_, arraylike) throws on ancient WebKit
- merge: function( first, second ) {
- var len = +second.length,
- j = 0,
- i = first.length;
- for ( ; j < len; j++ ) {
- first[ i++ ] = second[ j ];
- }
- first.length = i;
- return first;
- },
- grep: function( elems, callback, invert ) {
- var callbackInverse,
- matches = [],
- i = 0,
- length = elems.length,
- callbackExpect = !invert;
- // Go through the array, only saving the items
- // that pass the validator function
- for ( ; i < length; i++ ) {
- callbackInverse = !callback( elems[ i ], i );
- if ( callbackInverse !== callbackExpect ) {
- matches.push( elems[ i ] );
- }
- }
- return matches;
- },
- // arg is for internal usage only
- map: function( elems, callback, arg ) {
- var length, value,
- i = 0,
- ret = [];
- // Go through the array, translating each of the items to their new values
- if ( isArrayLike( elems ) ) {
- length = elems.length;
- for ( ; i < length; i++ ) {
- value = callback( elems[ i ], i, arg );
- if ( value != null ) {
- ret.push( value );
- }
- }
- // Go through every key on the object,
- } else {
- for ( i in elems ) {
- value = callback( elems[ i ], i, arg );
- if ( value != null ) {
- ret.push( value );
- }
- }
- }
- // Flatten any nested arrays
- return concat.apply( [], ret );
- },
- // A global GUID counter for objects
- guid: 1,
- // jQuery.support is not used in Core but other projects attach their
- // properties to it so it needs to exist.
- support: support
-} );
-if ( typeof Symbol === "function" ) {
- jQuery.fn[ Symbol.iterator ] = arr[ Symbol.iterator ];
-// Populate the class2type map
-jQuery.each( "Boolean Number String Function Array Date RegExp Object Error Symbol".split( " " ),
-function( i, name ) {
- class2type[ "[object " + name + "]" ] = name.toLowerCase();
-} );
-function isArrayLike( obj ) {
- // Support: real iOS 8.2 only (not reproducible in simulator)
- // `in` check used to prevent JIT error (gh-2145)
- // hasOwn isn't used here due to false negatives
- // regarding Nodelist length in IE
- var length = !!obj && "length" in obj && obj.length,
- type = toType( obj );
- if ( isFunction( obj ) || isWindow( obj ) ) {
- return false;
- }
- return type === "array" || length === 0 ||
- typeof length === "number" && length > 0 && ( length - 1 ) in obj;
-var Sizzle =
- * Sizzle CSS Selector Engine v2.3.4
- * https://sizzlejs.com/
- *
- * Copyright JS Foundation and other contributors
- * Released under the MIT license
- * https://js.foundation/
- *
- * Date: 2019-04-08
- */
-(function( window ) {
-var i,
- support,
- Expr,
- getText,
- isXML,
- tokenize,
- compile,
- select,
- outermostContext,
- sortInput,
- hasDuplicate,
- // Local document vars
- setDocument,
- document,
- docElem,
- documentIsHTML,
- rbuggyQSA,
- rbuggyMatches,
- matches,
- contains,
- // Instance-specific data
- expando = "sizzle" + 1 * new Date(),
- preferredDoc = window.document,
- dirruns = 0,
- done = 0,
- classCache = createCache(),
- tokenCache = createCache(),
- compilerCache = createCache(),
- nonnativeSelectorCache = createCache(),
- sortOrder = function( a, b ) {
- if ( a === b ) {
- hasDuplicate = true;
- }
- return 0;
- },
- // Instance methods
- hasOwn = ({}).hasOwnProperty,
- arr = [],
- pop = arr.pop,
- push_native = arr.push,
- push = arr.push,
- slice = arr.slice,
- // Use a stripped-down indexOf as it's faster than native
- // https://jsperf.com/thor-indexof-vs-for/5
- indexOf = function( list, elem ) {
- var i = 0,
- len = list.length;
- for ( ; i < len; i++ ) {
- if ( list[i] === elem ) {
- return i;
- }
- }
- return -1;
- },
- booleans = "checked|selected|async|autofocus|autoplay|controls|defer|disabled|hidden|ismap|loop|multiple|open|readonly|required|scoped",
- // Regular expressions
- // http://www.w3.org/TR/css3-selectors/#whitespace
- whitespace = "[\\x20\\t\\r\\n\\f]",
- // http://www.w3.org/TR/CSS21/syndata.html#value-def-identifier
- identifier = "(?:\\\\.|[\\w-]|[^\0-\\xa0])+",
- // Attribute selectors: http://www.w3.org/TR/selectors/#attribute-selectors
- attributes = "\\[" + whitespace + "*(" + identifier + ")(?:" + whitespace +
- // Operator (capture 2)
- "*([*^$|!~]?=)" + whitespace +
- // "Attribute values must be CSS identifiers [capture 5] or strings [capture 3 or capture 4]"
- "*(?:'((?:\\\\.|[^\\\\'])*)'|\"((?:\\\\.|[^\\\\\"])*)\"|(" + identifier + "))|)" + whitespace +
- "*\\]",
- pseudos = ":(" + identifier + ")(?:\\((" +
- // To reduce the number of selectors needing tokenize in the preFilter, prefer arguments:
- // 1. quoted (capture 3; capture 4 or capture 5)
- "('((?:\\\\.|[^\\\\'])*)'|\"((?:\\\\.|[^\\\\\"])*)\")|" +
- // 2. simple (capture 6)
- "((?:\\\\.|[^\\\\()[\\]]|" + attributes + ")*)|" +
- // 3. anything else (capture 2)
- ".*" +
- ")\\)|)",
- // Leading and non-escaped trailing whitespace, capturing some non-whitespace characters preceding the latter
- rwhitespace = new RegExp( whitespace + "+", "g" ),
- rtrim = new RegExp( "^" + whitespace + "+|((?:^|[^\\\\])(?:\\\\.)*)" + whitespace + "+$", "g" ),
- rcomma = new RegExp( "^" + whitespace + "*," + whitespace + "*" ),
- rcombinators = new RegExp( "^" + whitespace + "*([>+~]|" + whitespace + ")" + whitespace + "*" ),
- rdescend = new RegExp( whitespace + "|>" ),
- rpseudo = new RegExp( pseudos ),
- ridentifier = new RegExp( "^" + identifier + "$" ),
- matchExpr = {
- "ID": new RegExp( "^#(" + identifier + ")" ),
- "CLASS": new RegExp( "^\\.(" + identifier + ")" ),
- "TAG": new RegExp( "^(" + identifier + "|[*])" ),
- "ATTR": new RegExp( "^" + attributes ),
- "PSEUDO": new RegExp( "^" + pseudos ),
- "CHILD": new RegExp( "^:(only|first|last|nth|nth-last)-(child|of-type)(?:\\(" + whitespace +
- "*(even|odd|(([+-]|)(\\d*)n|)" + whitespace + "*(?:([+-]|)" + whitespace +
- "*(\\d+)|))" + whitespace + "*\\)|)", "i" ),
- "bool": new RegExp( "^(?:" + booleans + ")$", "i" ),
- // For use in libraries implementing .is()
- // We use this for POS matching in `select`
- "needsContext": new RegExp( "^" + whitespace + "*[>+~]|:(even|odd|eq|gt|lt|nth|first|last)(?:\\(" +
- whitespace + "*((?:-\\d)?\\d*)" + whitespace + "*\\)|)(?=[^-]|$)", "i" )
- },
- rhtml = /HTML$/i,
- rinputs = /^(?:input|select|textarea|button)$/i,
- rheader = /^h\d$/i,
- rnative = /^[^{]+\{\s*\[native \w/,
- // Easily-parseable/retrievable ID or TAG or CLASS selectors
- rquickExpr = /^(?:#([\w-]+)|(\w+)|\.([\w-]+))$/,
- rsibling = /[+~]/,
- // CSS escapes
- // http://www.w3.org/TR/CSS21/syndata.html#escaped-characters
- runescape = new RegExp( "\\\\([\\da-f]{1,6}" + whitespace + "?|(" + whitespace + ")|.)", "ig" ),
- funescape = function( _, escaped, escapedWhitespace ) {
- var high = "0x" + escaped - 0x10000;
- // NaN means non-codepoint
- // Support: Firefox<24
- // Workaround erroneous numeric interpretation of +"0x"
- return high !== high || escapedWhitespace ?
- escaped :
- high < 0 ?
- // BMP codepoint
- String.fromCharCode( high + 0x10000 ) :
- // Supplemental Plane codepoint (surrogate pair)
- String.fromCharCode( high >> 10 | 0xD800, high & 0x3FF | 0xDC00 );
- },
- // CSS string/identifier serialization
- // https://drafts.csswg.org/cssom/#common-serializing-idioms
- rcssescape = /([\0-\x1f\x7f]|^-?\d)|^-$|[^\0-\x1f\x7f-\uFFFF\w-]/g,
- fcssescape = function( ch, asCodePoint ) {
- if ( asCodePoint ) {
- if ( ch === "\0" ) {
- return "\uFFFD";
- }
- // Control characters and (dependent upon position) numbers get escaped as code points
- return ch.slice( 0, -1 ) + "\\" + ch.charCodeAt( ch.length - 1 ).toString( 16 ) + " ";
- }
- // Other potentially-special ASCII characters get backslash-escaped
- return "\\" + ch;
- },
- // Used for iframes
- // See setDocument()
- // Removing the function wrapper causes a "Permission Denied"
- // error in IE
- unloadHandler = function() {
- setDocument();
- },
- inDisabledFieldset = addCombinator(
- function( elem ) {
- return elem.disabled === true && elem.nodeName.toLowerCase() === "fieldset";
- },
- { dir: "parentNode", next: "legend" }
- );
-// Optimize for push.apply( _, NodeList )
-try {
- push.apply(
- (arr = slice.call( preferredDoc.childNodes )),
- preferredDoc.childNodes
- );
- // Support: Android<4.0
- // Detect silently failing push.apply
- arr[ preferredDoc.childNodes.length ].nodeType;
-} catch ( e ) {
- push = { apply: arr.length ?
- // Leverage slice if possible
- function( target, els ) {
- push_native.apply( target, slice.call(els) );
- } :
- // Support: IE<9
- // Otherwise append directly
- function( target, els ) {
- var j = target.length,
- i = 0;
- // Can't trust NodeList.length
- while ( (target[j++] = els[i++]) ) {}
- target.length = j - 1;
- }
- };
-function Sizzle( selector, context, results, seed ) {
- var m, i, elem, nid, match, groups, newSelector,
- newContext = context && context.ownerDocument,
- // nodeType defaults to 9, since context defaults to document
- nodeType = context ? context.nodeType : 9;
- results = results || [];
- // Return early from calls with invalid selector or context
- if ( typeof selector !== "string" || !selector ||
- nodeType !== 1 && nodeType !== 9 && nodeType !== 11 ) {
- return results;
- }
- // Try to shortcut find operations (as opposed to filters) in HTML documents
- if ( !seed ) {
- if ( ( context ? context.ownerDocument || context : preferredDoc ) !== document ) {
- setDocument( context );
- }
- context = context || document;
- if ( documentIsHTML ) {
- // If the selector is sufficiently simple, try using a "get*By*" DOM method
- // (excepting DocumentFragment context, where the methods don't exist)
- if ( nodeType !== 11 && (match = rquickExpr.exec( selector )) ) {
- // ID selector
- if ( (m = match[1]) ) {
- // Document context
- if ( nodeType === 9 ) {
- if ( (elem = context.getElementById( m )) ) {
- // Support: IE, Opera, Webkit
- // TODO: identify versions
- // getElementById can match elements by name instead of ID
- if ( elem.id === m ) {
- results.push( elem );
- return results;
- }
- } else {
- return results;
- }
- // Element context
- } else {
- // Support: IE, Opera, Webkit
- // TODO: identify versions
- // getElementById can match elements by name instead of ID
- if ( newContext && (elem = newContext.getElementById( m )) &&
- contains( context, elem ) &&
- elem.id === m ) {
- results.push( elem );
- return results;
- }
- }
- // Type selector
- } else if ( match[2] ) {
- push.apply( results, context.getElementsByTagName( selector ) );
- return results;
- // Class selector
- } else if ( (m = match[3]) && support.getElementsByClassName &&
- context.getElementsByClassName ) {
- push.apply( results, context.getElementsByClassName( m ) );
- return results;
- }
- }
- // Take advantage of querySelectorAll
- if ( support.qsa &&
- !nonnativeSelectorCache[ selector + " " ] &&
- (!rbuggyQSA || !rbuggyQSA.test( selector )) &&
- // Support: IE 8 only
- // Exclude object elements
- (nodeType !== 1 || context.nodeName.toLowerCase() !== "object") ) {
- newSelector = selector;
- newContext = context;
- // qSA considers elements outside a scoping root when evaluating child or
- // descendant combinators, which is not what we want.
- // In such cases, we work around the behavior by prefixing every selector in the
- // list with an ID selector referencing the scope context.
- // Thanks to Andrew Dupont for this technique.
- if ( nodeType === 1 && rdescend.test( selector ) ) {
- // Capture the context ID, setting it first if necessary
- if ( (nid = context.getAttribute( "id" )) ) {
- nid = nid.replace( rcssescape, fcssescape );
- } else {
- context.setAttribute( "id", (nid = expando) );
- }
- // Prefix every selector in the list
- groups = tokenize( selector );
- i = groups.length;
- while ( i-- ) {
- groups[i] = "#" + nid + " " + toSelector( groups[i] );
- }
- newSelector = groups.join( "," );
- // Expand context for sibling selectors
- newContext = rsibling.test( selector ) && testContext( context.parentNode ) ||
- context;
- }
- try {
- push.apply( results,
- newContext.querySelectorAll( newSelector )
- );
- return results;
- } catch ( qsaError ) {
- nonnativeSelectorCache( selector, true );
- } finally {
- if ( nid === expando ) {
- context.removeAttribute( "id" );
- }
- }
- }
- }
- }
- // All others
- return select( selector.replace( rtrim, "$1" ), context, results, seed );
- * Create key-value caches of limited size
- * @returns {function(string, object)} Returns the Object data after storing it on itself with
- * property name the (space-suffixed) string and (if the cache is larger than Expr.cacheLength)
- * deleting the oldest entry
- */
-function createCache() {
- var keys = [];
- function cache( key, value ) {
- // Use (key + " ") to avoid collision with native prototype properties (see Issue #157)
- if ( keys.push( key + " " ) > Expr.cacheLength ) {
- // Only keep the most recent entries
- delete cache[ keys.shift() ];
- }
- return (cache[ key + " " ] = value);
- }
- return cache;
- * Mark a function for special use by Sizzle
- * @param {Function} fn The function to mark
- */
-function markFunction( fn ) {
- fn[ expando ] = true;
- return fn;
- * Support testing using an element
- * @param {Function} fn Passed the created element and returns a boolean result
- */
-function assert( fn ) {
- var el = document.createElement("fieldset");
- try {
- return !!fn( el );
- } catch (e) {
- return false;
- } finally {
- // Remove from its parent by default
- if ( el.parentNode ) {
- el.parentNode.removeChild( el );
- }
- // release memory in IE
- el = null;
- }
- * Adds the same handler for all of the specified attrs
- * @param {String} attrs Pipe-separated list of attributes
- * @param {Function} handler The method that will be applied
- */
-function addHandle( attrs, handler ) {
- var arr = attrs.split("|"),
- i = arr.length;
- while ( i-- ) {
- Expr.attrHandle[ arr[i] ] = handler;
- }
- * Checks document order of two siblings
- * @param {Element} a
- * @param {Element} b
- * @returns {Number} Returns less than 0 if a precedes b, greater than 0 if a follows b
- */
-function siblingCheck( a, b ) {
- var cur = b && a,
- diff = cur && a.nodeType === 1 && b.nodeType === 1 &&
- a.sourceIndex - b.sourceIndex;
- // Use IE sourceIndex if available on both nodes
- if ( diff ) {
- return diff;
- }
- // Check if b follows a
- if ( cur ) {
- while ( (cur = cur.nextSibling) ) {
- if ( cur === b ) {
- return -1;
- }
- }
- }
- return a ? 1 : -1;
- * Returns a function to use in pseudos for input types
- * @param {String} type
- */
-function createInputPseudo( type ) {
- return function( elem ) {
- var name = elem.nodeName.toLowerCase();
- return name === "input" && elem.type === type;
- };
- * Returns a function to use in pseudos for buttons
- * @param {String} type
- */
-function createButtonPseudo( type ) {
- return function( elem ) {
- var name = elem.nodeName.toLowerCase();
- return (name === "input" || name === "button") && elem.type === type;
- };
- * Returns a function to use in pseudos for :enabled/:disabled
- * @param {Boolean} disabled true for :disabled; false for :enabled
- */
-function createDisabledPseudo( disabled ) {
- // Known :disabled false positives: fieldset[disabled] > legend:nth-of-type(n+2) :can-disable
- return function( elem ) {
- // Only certain elements can match :enabled or :disabled
- // https://html.spec.whatwg.org/multipage/scripting.html#selector-enabled
- // https://html.spec.whatwg.org/multipage/scripting.html#selector-disabled
- if ( "form" in elem ) {
- // Check for inherited disabledness on relevant non-disabled elements:
- // * listed form-associated elements in a disabled fieldset
- // https://html.spec.whatwg.org/multipage/forms.html#category-listed
- // https://html.spec.whatwg.org/multipage/forms.html#concept-fe-disabled
- // * option elements in a disabled optgroup
- // https://html.spec.whatwg.org/multipage/forms.html#concept-option-disabled
- // All such elements have a "form" property.
- if ( elem.parentNode && elem.disabled === false ) {
- // Option elements defer to a parent optgroup if present
- if ( "label" in elem ) {
- if ( "label" in elem.parentNode ) {
- return elem.parentNode.disabled === disabled;
- } else {
- return elem.disabled === disabled;
- }
- }
- // Support: IE 6 - 11
- // Use the isDisabled shortcut property to check for disabled fieldset ancestors
- return elem.isDisabled === disabled ||
- // Where there is no isDisabled, check manually
- /* jshint -W018 */
- elem.isDisabled !== !disabled &&
- inDisabledFieldset( elem ) === disabled;
- }
- return elem.disabled === disabled;
- // Try to winnow out elements that can't be disabled before trusting the disabled property.
- // Some victims get caught in our net (label, legend, menu, track), but it shouldn't
- // even exist on them, let alone have a boolean value.
- } else if ( "label" in elem ) {
- return elem.disabled === disabled;
- }
- // Remaining elements are neither :enabled nor :disabled
- return false;
- };
- * Returns a function to use in pseudos for positionals
- * @param {Function} fn
- */
-function createPositionalPseudo( fn ) {
- return markFunction(function( argument ) {
- argument = +argument;
- return markFunction(function( seed, matches ) {
- var j,
- matchIndexes = fn( [], seed.length, argument ),
- i = matchIndexes.length;
- // Match elements found at the specified indexes
- while ( i-- ) {
- if ( seed[ (j = matchIndexes[i]) ] ) {
- seed[j] = !(matches[j] = seed[j]);
- }
- }
- });
- });
- * Checks a node for validity as a Sizzle context
- * @param {Element|Object=} context
- * @returns {Element|Object|Boolean} The input node if acceptable, otherwise a falsy value
- */
-function testContext( context ) {
- return context && typeof context.getElementsByTagName !== "undefined" && context;
-// Expose support vars for convenience
-support = Sizzle.support = {};
- * Detects XML nodes
- * @param {Element|Object} elem An element or a document
- * @returns {Boolean} True iff elem is a non-HTML XML node
- */
-isXML = Sizzle.isXML = function( elem ) {
- var namespace = elem.namespaceURI,
- docElem = (elem.ownerDocument || elem).documentElement;
- // Support: IE <=8
- // Assume HTML when documentElement doesn't yet exist, such as inside loading iframes
- // https://bugs.jquery.com/ticket/4833
- return !rhtml.test( namespace || docElem && docElem.nodeName || "HTML" );
- * Sets document-related variables once based on the current document
- * @param {Element|Object} [doc] An element or document object to use to set the document
- * @returns {Object} Returns the current document
- */
-setDocument = Sizzle.setDocument = function( node ) {
- var hasCompare, subWindow,
- doc = node ? node.ownerDocument || node : preferredDoc;
- // Return early if doc is invalid or already selected
- if ( doc === document || doc.nodeType !== 9 || !doc.documentElement ) {
- return document;
- }
- // Update global variables
- document = doc;
- docElem = document.documentElement;
- documentIsHTML = !isXML( document );
- // Support: IE 9-11, Edge
- // Accessing iframe documents after unload throws "permission denied" errors (jQuery #13936)
- if ( preferredDoc !== document &&
- (subWindow = document.defaultView) && subWindow.top !== subWindow ) {
- // Support: IE 11, Edge
- if ( subWindow.addEventListener ) {
- subWindow.addEventListener( "unload", unloadHandler, false );
- // Support: IE 9 - 10 only
- } else if ( subWindow.attachEvent ) {
- subWindow.attachEvent( "onunload", unloadHandler );
- }
- }
- /* Attributes
- ---------------------------------------------------------------------- */
- // Support: IE<8
- // Verify that getAttribute really returns attributes and not properties
- // (excepting IE8 booleans)
- support.attributes = assert(function( el ) {
- el.className = "i";
- return !el.getAttribute("className");
- });
- /* getElement(s)By*
- ---------------------------------------------------------------------- */
- // Check if getElementsByTagName("*") returns only elements
- support.getElementsByTagName = assert(function( el ) {
- el.appendChild( document.createComment("") );
- return !el.getElementsByTagName("*").length;
- });
- // Support: IE<9
- support.getElementsByClassName = rnative.test( document.getElementsByClassName );
- // Support: IE<10
- // Check if getElementById returns elements by name
- // The broken getElementById methods don't pick up programmatically-set names,
- // so use a roundabout getElementsByName test
- support.getById = assert(function( el ) {
- docElem.appendChild( el ).id = expando;
- return !document.getElementsByName || !document.getElementsByName( expando ).length;
- });
- // ID filter and find
- if ( support.getById ) {
- Expr.filter["ID"] = function( id ) {
- var attrId = id.replace( runescape, funescape );
- return function( elem ) {
- return elem.getAttribute("id") === attrId;
- };
- };
- Expr.find["ID"] = function( id, context ) {
- if ( typeof context.getElementById !== "undefined" && documentIsHTML ) {
- var elem = context.getElementById( id );
- return elem ? [ elem ] : [];
- }
- };
- } else {
- Expr.filter["ID"] = function( id ) {
- var attrId = id.replace( runescape, funescape );
- return function( elem ) {
- var node = typeof elem.getAttributeNode !== "undefined" &&
- elem.getAttributeNode("id");
- return node && node.value === attrId;
- };
- };
- // Support: IE 6 - 7 only
- // getElementById is not reliable as a find shortcut
- Expr.find["ID"] = function( id, context ) {
- if ( typeof context.getElementById !== "undefined" && documentIsHTML ) {
- var node, i, elems,
- elem = context.getElementById( id );
- if ( elem ) {
- // Verify the id attribute
- node = elem.getAttributeNode("id");
- if ( node && node.value === id ) {
- return [ elem ];
- }
- // Fall back on getElementsByName
- elems = context.getElementsByName( id );
- i = 0;
- while ( (elem = elems[i++]) ) {
- node = elem.getAttributeNode("id");
- if ( node && node.value === id ) {
- return [ elem ];
- }
- }
- }
- return [];
- }
- };
- }
- // Tag
- Expr.find["TAG"] = support.getElementsByTagName ?
- function( tag, context ) {
- if ( typeof context.getElementsByTagName !== "undefined" ) {
- return context.getElementsByTagName( tag );
- // DocumentFragment nodes don't have gEBTN
- } else if ( support.qsa ) {
- return context.querySelectorAll( tag );
- }
- } :
- function( tag, context ) {
- var elem,
- tmp = [],
- i = 0,
- // By happy coincidence, a (broken) gEBTN appears on DocumentFragment nodes too
- results = context.getElementsByTagName( tag );
- // Filter out possible comments
- if ( tag === "*" ) {
- while ( (elem = results[i++]) ) {
- if ( elem.nodeType === 1 ) {
- tmp.push( elem );
- }
- }
- return tmp;
- }
- return results;
- };
- // Class
- Expr.find["CLASS"] = support.getElementsByClassName && function( className, context ) {
- if ( typeof context.getElementsByClassName !== "undefined" && documentIsHTML ) {
- return context.getElementsByClassName( className );
- }
- };
- /* QSA/matchesSelector
- ---------------------------------------------------------------------- */
- // QSA and matchesSelector support
- // matchesSelector(:active) reports false when true (IE9/Opera 11.5)
- rbuggyMatches = [];
- // qSa(:focus) reports false when true (Chrome 21)
- // We allow this because of a bug in IE8/9 that throws an error
- // whenever `document.activeElement` is accessed on an iframe
- // So, we allow :focus to pass through QSA all the time to avoid the IE error
- // See https://bugs.jquery.com/ticket/13378
- rbuggyQSA = [];
- if ( (support.qsa = rnative.test( document.querySelectorAll )) ) {
- // Build QSA regex
- // Regex strategy adopted from Diego Perini
- assert(function( el ) {
- // Select is set to empty string on purpose
- // This is to test IE's treatment of not explicitly
- // setting a boolean content attribute,
- // since its presence should be enough
- // https://bugs.jquery.com/ticket/12359
- docElem.appendChild( el ).innerHTML = " " +
- "" +
- " ";
- // Support: IE8, Opera 11-12.16
- // Nothing should be selected when empty strings follow ^= or $= or *=
- // The test attribute must be unknown in Opera but "safe" for WinRT
- // https://msdn.microsoft.com/en-us/library/ie/hh465388.aspx#attribute_section
- if ( el.querySelectorAll("[msallowcapture^='']").length ) {
- rbuggyQSA.push( "[*^$]=" + whitespace + "*(?:''|\"\")" );
- }
- // Support: IE8
- // Boolean attributes and "value" are not treated correctly
- if ( !el.querySelectorAll("[selected]").length ) {
- rbuggyQSA.push( "\\[" + whitespace + "*(?:value|" + booleans + ")" );
- }
- // Support: Chrome<29, Android<4.4, Safari<7.0+, iOS<7.0+, PhantomJS<1.9.8+
- if ( !el.querySelectorAll( "[id~=" + expando + "-]" ).length ) {
- rbuggyQSA.push("~=");
- }
- // Webkit/Opera - :checked should return selected option elements
- // http://www.w3.org/TR/2011/REC-css3-selectors-20110929/#checked
- // IE8 throws error here and will not see later tests
- if ( !el.querySelectorAll(":checked").length ) {
- rbuggyQSA.push(":checked");
- }
- // Support: Safari 8+, iOS 8+
- // https://bugs.webkit.org/show_bug.cgi?id=136851
- // In-page `selector#id sibling-combinator selector` fails
- if ( !el.querySelectorAll( "a#" + expando + "+*" ).length ) {
- rbuggyQSA.push(".#.+[+~]");
- }
- });
- assert(function( el ) {
- el.innerHTML = " " +
- " ";
- // Support: Windows 8 Native Apps
- // The type and name attributes are restricted during .innerHTML assignment
- var input = document.createElement("input");
- input.setAttribute( "type", "hidden" );
- el.appendChild( input ).setAttribute( "name", "D" );
- // Support: IE8
- // Enforce case-sensitivity of name attribute
- if ( el.querySelectorAll("[name=d]").length ) {
- rbuggyQSA.push( "name" + whitespace + "*[*^$|!~]?=" );
- }
- // FF 3.5 - :enabled/:disabled and hidden elements (hidden elements are still enabled)
- // IE8 throws error here and will not see later tests
- if ( el.querySelectorAll(":enabled").length !== 2 ) {
- rbuggyQSA.push( ":enabled", ":disabled" );
- }
- // Support: IE9-11+
- // IE's :disabled selector does not pick up the children of disabled fieldsets
- docElem.appendChild( el ).disabled = true;
- if ( el.querySelectorAll(":disabled").length !== 2 ) {
- rbuggyQSA.push( ":enabled", ":disabled" );
- }
- // Opera 10-11 does not throw on post-comma invalid pseudos
- el.querySelectorAll("*,:x");
- rbuggyQSA.push(",.*:");
- });
- }
- if ( (support.matchesSelector = rnative.test( (matches = docElem.matches ||
- docElem.webkitMatchesSelector ||
- docElem.mozMatchesSelector ||
- docElem.oMatchesSelector ||
- docElem.msMatchesSelector) )) ) {
- assert(function( el ) {
- // Check to see if it's possible to do matchesSelector
- // on a disconnected node (IE 9)
- support.disconnectedMatch = matches.call( el, "*" );
- // This should fail with an exception
- // Gecko does not error, returns false instead
- matches.call( el, "[s!='']:x" );
- rbuggyMatches.push( "!=", pseudos );
- });
- }
- rbuggyQSA = rbuggyQSA.length && new RegExp( rbuggyQSA.join("|") );
- rbuggyMatches = rbuggyMatches.length && new RegExp( rbuggyMatches.join("|") );
- /* Contains
- ---------------------------------------------------------------------- */
- hasCompare = rnative.test( docElem.compareDocumentPosition );
- // Element contains another
- // Purposefully self-exclusive
- // As in, an element does not contain itself
- contains = hasCompare || rnative.test( docElem.contains ) ?
- function( a, b ) {
- var adown = a.nodeType === 9 ? a.documentElement : a,
- bup = b && b.parentNode;
- return a === bup || !!( bup && bup.nodeType === 1 && (
- adown.contains ?
- adown.contains( bup ) :
- a.compareDocumentPosition && a.compareDocumentPosition( bup ) & 16
- ));
- } :
- function( a, b ) {
- if ( b ) {
- while ( (b = b.parentNode) ) {
- if ( b === a ) {
- return true;
- }
- }
- }
- return false;
- };
- /* Sorting
- ---------------------------------------------------------------------- */
- // Document order sorting
- sortOrder = hasCompare ?
- function( a, b ) {
- // Flag for duplicate removal
- if ( a === b ) {
- hasDuplicate = true;
- return 0;
- }
- // Sort on method existence if only one input has compareDocumentPosition
- var compare = !a.compareDocumentPosition - !b.compareDocumentPosition;
- if ( compare ) {
- return compare;
- }
- // Calculate position if both inputs belong to the same document
- compare = ( a.ownerDocument || a ) === ( b.ownerDocument || b ) ?
- a.compareDocumentPosition( b ) :
- // Otherwise we know they are disconnected
- 1;
- // Disconnected nodes
- if ( compare & 1 ||
- (!support.sortDetached && b.compareDocumentPosition( a ) === compare) ) {
- // Choose the first element that is related to our preferred document
- if ( a === document || a.ownerDocument === preferredDoc && contains(preferredDoc, a) ) {
- return -1;
- }
- if ( b === document || b.ownerDocument === preferredDoc && contains(preferredDoc, b) ) {
- return 1;
- }
- // Maintain original order
- return sortInput ?
- ( indexOf( sortInput, a ) - indexOf( sortInput, b ) ) :
- 0;
- }
- return compare & 4 ? -1 : 1;
- } :
- function( a, b ) {
- // Exit early if the nodes are identical
- if ( a === b ) {
- hasDuplicate = true;
- return 0;
- }
- var cur,
- i = 0,
- aup = a.parentNode,
- bup = b.parentNode,
- ap = [ a ],
- bp = [ b ];
- // Parentless nodes are either documents or disconnected
- if ( !aup || !bup ) {
- return a === document ? -1 :
- b === document ? 1 :
- aup ? -1 :
- bup ? 1 :
- sortInput ?
- ( indexOf( sortInput, a ) - indexOf( sortInput, b ) ) :
- 0;
- // If the nodes are siblings, we can do a quick check
- } else if ( aup === bup ) {
- return siblingCheck( a, b );
- }
- // Otherwise we need full lists of their ancestors for comparison
- cur = a;
- while ( (cur = cur.parentNode) ) {
- ap.unshift( cur );
- }
- cur = b;
- while ( (cur = cur.parentNode) ) {
- bp.unshift( cur );
- }
- // Walk down the tree looking for a discrepancy
- while ( ap[i] === bp[i] ) {
- i++;
- }
- return i ?
- // Do a sibling check if the nodes have a common ancestor
- siblingCheck( ap[i], bp[i] ) :
- // Otherwise nodes in our document sort first
- ap[i] === preferredDoc ? -1 :
- bp[i] === preferredDoc ? 1 :
- 0;
- };
- return document;
-Sizzle.matches = function( expr, elements ) {
- return Sizzle( expr, null, null, elements );
-Sizzle.matchesSelector = function( elem, expr ) {
- // Set document vars if needed
- if ( ( elem.ownerDocument || elem ) !== document ) {
- setDocument( elem );
- }
- if ( support.matchesSelector && documentIsHTML &&
- !nonnativeSelectorCache[ expr + " " ] &&
- ( !rbuggyMatches || !rbuggyMatches.test( expr ) ) &&
- ( !rbuggyQSA || !rbuggyQSA.test( expr ) ) ) {
- try {
- var ret = matches.call( elem, expr );
- // IE 9's matchesSelector returns false on disconnected nodes
- if ( ret || support.disconnectedMatch ||
- // As well, disconnected nodes are said to be in a document
- // fragment in IE 9
- elem.document && elem.document.nodeType !== 11 ) {
- return ret;
- }
- } catch (e) {
- nonnativeSelectorCache( expr, true );
- }
- }
- return Sizzle( expr, document, null, [ elem ] ).length > 0;
-Sizzle.contains = function( context, elem ) {
- // Set document vars if needed
- if ( ( context.ownerDocument || context ) !== document ) {
- setDocument( context );
- }
- return contains( context, elem );
-Sizzle.attr = function( elem, name ) {
- // Set document vars if needed
- if ( ( elem.ownerDocument || elem ) !== document ) {
- setDocument( elem );
- }
- var fn = Expr.attrHandle[ name.toLowerCase() ],
- // Don't get fooled by Object.prototype properties (jQuery #13807)
- val = fn && hasOwn.call( Expr.attrHandle, name.toLowerCase() ) ?
- fn( elem, name, !documentIsHTML ) :
- undefined;
- return val !== undefined ?
- val :
- support.attributes || !documentIsHTML ?
- elem.getAttribute( name ) :
- (val = elem.getAttributeNode(name)) && val.specified ?
- val.value :
- null;
-Sizzle.escape = function( sel ) {
- return (sel + "").replace( rcssescape, fcssescape );
-Sizzle.error = function( msg ) {
- throw new Error( "Syntax error, unrecognized expression: " + msg );
- * Document sorting and removing duplicates
- * @param {ArrayLike} results
- */
-Sizzle.uniqueSort = function( results ) {
- var elem,
- duplicates = [],
- j = 0,
- i = 0;
- // Unless we *know* we can detect duplicates, assume their presence
- hasDuplicate = !support.detectDuplicates;
- sortInput = !support.sortStable && results.slice( 0 );
- results.sort( sortOrder );
- if ( hasDuplicate ) {
- while ( (elem = results[i++]) ) {
- if ( elem === results[ i ] ) {
- j = duplicates.push( i );
- }
- }
- while ( j-- ) {
- results.splice( duplicates[ j ], 1 );
- }
- }
- // Clear input after sorting to release objects
- // See https://github.com/jquery/sizzle/pull/225
- sortInput = null;
- return results;
- * Utility function for retrieving the text value of an array of DOM nodes
- * @param {Array|Element} elem
- */
-getText = Sizzle.getText = function( elem ) {
- var node,
- ret = "",
- i = 0,
- nodeType = elem.nodeType;
- if ( !nodeType ) {
- // If no nodeType, this is expected to be an array
- while ( (node = elem[i++]) ) {
- // Do not traverse comment nodes
- ret += getText( node );
- }
- } else if ( nodeType === 1 || nodeType === 9 || nodeType === 11 ) {
- // Use textContent for elements
- // innerText usage removed for consistency of new lines (jQuery #11153)
- if ( typeof elem.textContent === "string" ) {
- return elem.textContent;
- } else {
- // Traverse its children
- for ( elem = elem.firstChild; elem; elem = elem.nextSibling ) {
- ret += getText( elem );
- }
- }
- } else if ( nodeType === 3 || nodeType === 4 ) {
- return elem.nodeValue;
- }
- // Do not include comment or processing instruction nodes
- return ret;
-Expr = Sizzle.selectors = {
- // Can be adjusted by the user
- cacheLength: 50,
- createPseudo: markFunction,
- match: matchExpr,
- attrHandle: {},
- find: {},
- relative: {
- ">": { dir: "parentNode", first: true },
- " ": { dir: "parentNode" },
- "+": { dir: "previousSibling", first: true },
- "~": { dir: "previousSibling" }
- },
- preFilter: {
- "ATTR": function( match ) {
- match[1] = match[1].replace( runescape, funescape );
- // Move the given value to match[3] whether quoted or unquoted
- match[3] = ( match[3] || match[4] || match[5] || "" ).replace( runescape, funescape );
- if ( match[2] === "~=" ) {
- match[3] = " " + match[3] + " ";
- }
- return match.slice( 0, 4 );
- },
- "CHILD": function( match ) {
- /* matches from matchExpr["CHILD"]
- 1 type (only|nth|...)
- 2 what (child|of-type)
- 3 argument (even|odd|\d*|\d*n([+-]\d+)?|...)
- 4 xn-component of xn+y argument ([+-]?\d*n|)
- 5 sign of xn-component
- 6 x of xn-component
- 7 sign of y-component
- 8 y of y-component
- */
- match[1] = match[1].toLowerCase();
- if ( match[1].slice( 0, 3 ) === "nth" ) {
- // nth-* requires argument
- if ( !match[3] ) {
- Sizzle.error( match[0] );
- }
- // numeric x and y parameters for Expr.filter.CHILD
- // remember that false/true cast respectively to 0/1
- match[4] = +( match[4] ? match[5] + (match[6] || 1) : 2 * ( match[3] === "even" || match[3] === "odd" ) );
- match[5] = +( ( match[7] + match[8] ) || match[3] === "odd" );
- // other types prohibit arguments
- } else if ( match[3] ) {
- Sizzle.error( match[0] );
- }
- return match;
- },
- "PSEUDO": function( match ) {
- var excess,
- unquoted = !match[6] && match[2];
- if ( matchExpr["CHILD"].test( match[0] ) ) {
- return null;
- }
- // Accept quoted arguments as-is
- if ( match[3] ) {
- match[2] = match[4] || match[5] || "";
- // Strip excess characters from unquoted arguments
- } else if ( unquoted && rpseudo.test( unquoted ) &&
- // Get excess from tokenize (recursively)
- (excess = tokenize( unquoted, true )) &&
- // advance to the next closing parenthesis
- (excess = unquoted.indexOf( ")", unquoted.length - excess ) - unquoted.length) ) {
- // excess is a negative index
- match[0] = match[0].slice( 0, excess );
- match[2] = unquoted.slice( 0, excess );
- }
- // Return only captures needed by the pseudo filter method (type and argument)
- return match.slice( 0, 3 );
- }
- },
- filter: {
- "TAG": function( nodeNameSelector ) {
- var nodeName = nodeNameSelector.replace( runescape, funescape ).toLowerCase();
- return nodeNameSelector === "*" ?
- function() { return true; } :
- function( elem ) {
- return elem.nodeName && elem.nodeName.toLowerCase() === nodeName;
- };
- },
- "CLASS": function( className ) {
- var pattern = classCache[ className + " " ];
- return pattern ||
- (pattern = new RegExp( "(^|" + whitespace + ")" + className + "(" + whitespace + "|$)" )) &&
- classCache( className, function( elem ) {
- return pattern.test( typeof elem.className === "string" && elem.className || typeof elem.getAttribute !== "undefined" && elem.getAttribute("class") || "" );
- });
- },
- "ATTR": function( name, operator, check ) {
- return function( elem ) {
- var result = Sizzle.attr( elem, name );
- if ( result == null ) {
- return operator === "!=";
- }
- if ( !operator ) {
- return true;
- }
- result += "";
- return operator === "=" ? result === check :
- operator === "!=" ? result !== check :
- operator === "^=" ? check && result.indexOf( check ) === 0 :
- operator === "*=" ? check && result.indexOf( check ) > -1 :
- operator === "$=" ? check && result.slice( -check.length ) === check :
- operator === "~=" ? ( " " + result.replace( rwhitespace, " " ) + " " ).indexOf( check ) > -1 :
- operator === "|=" ? result === check || result.slice( 0, check.length + 1 ) === check + "-" :
- false;
- };
- },
- "CHILD": function( type, what, argument, first, last ) {
- var simple = type.slice( 0, 3 ) !== "nth",
- forward = type.slice( -4 ) !== "last",
- ofType = what === "of-type";
- return first === 1 && last === 0 ?
- // Shortcut for :nth-*(n)
- function( elem ) {
- return !!elem.parentNode;
- } :
- function( elem, context, xml ) {
- var cache, uniqueCache, outerCache, node, nodeIndex, start,
- dir = simple !== forward ? "nextSibling" : "previousSibling",
- parent = elem.parentNode,
- name = ofType && elem.nodeName.toLowerCase(),
- useCache = !xml && !ofType,
- diff = false;
- if ( parent ) {
- // :(first|last|only)-(child|of-type)
- if ( simple ) {
- while ( dir ) {
- node = elem;
- while ( (node = node[ dir ]) ) {
- if ( ofType ?
- node.nodeName.toLowerCase() === name :
- node.nodeType === 1 ) {
- return false;
- }
- }
- // Reverse direction for :only-* (if we haven't yet done so)
- start = dir = type === "only" && !start && "nextSibling";
- }
- return true;
- }
- start = [ forward ? parent.firstChild : parent.lastChild ];
- // non-xml :nth-child(...) stores cache data on `parent`
- if ( forward && useCache ) {
- // Seek `elem` from a previously-cached index
- // ...in a gzip-friendly way
- node = parent;
- outerCache = node[ expando ] || (node[ expando ] = {});
- // Support: IE <9 only
- // Defend against cloned attroperties (jQuery gh-1709)
- uniqueCache = outerCache[ node.uniqueID ] ||
- (outerCache[ node.uniqueID ] = {});
- cache = uniqueCache[ type ] || [];
- nodeIndex = cache[ 0 ] === dirruns && cache[ 1 ];
- diff = nodeIndex && cache[ 2 ];
- node = nodeIndex && parent.childNodes[ nodeIndex ];
- while ( (node = ++nodeIndex && node && node[ dir ] ||
- // Fallback to seeking `elem` from the start
- (diff = nodeIndex = 0) || start.pop()) ) {
- // When found, cache indexes on `parent` and break
- if ( node.nodeType === 1 && ++diff && node === elem ) {
- uniqueCache[ type ] = [ dirruns, nodeIndex, diff ];
- break;
- }
- }
- } else {
- // Use previously-cached element index if available
- if ( useCache ) {
- // ...in a gzip-friendly way
- node = elem;
- outerCache = node[ expando ] || (node[ expando ] = {});
- // Support: IE <9 only
- // Defend against cloned attroperties (jQuery gh-1709)
- uniqueCache = outerCache[ node.uniqueID ] ||
- (outerCache[ node.uniqueID ] = {});
- cache = uniqueCache[ type ] || [];
- nodeIndex = cache[ 0 ] === dirruns && cache[ 1 ];
- diff = nodeIndex;
- }
- // xml :nth-child(...)
- // or :nth-last-child(...) or :nth(-last)?-of-type(...)
- if ( diff === false ) {
- // Use the same loop as above to seek `elem` from the start
- while ( (node = ++nodeIndex && node && node[ dir ] ||
- (diff = nodeIndex = 0) || start.pop()) ) {
- if ( ( ofType ?
- node.nodeName.toLowerCase() === name :
- node.nodeType === 1 ) &&
- ++diff ) {
- // Cache the index of each encountered element
- if ( useCache ) {
- outerCache = node[ expando ] || (node[ expando ] = {});
- // Support: IE <9 only
- // Defend against cloned attroperties (jQuery gh-1709)
- uniqueCache = outerCache[ node.uniqueID ] ||
- (outerCache[ node.uniqueID ] = {});
- uniqueCache[ type ] = [ dirruns, diff ];
- }
- if ( node === elem ) {
- break;
- }
- }
- }
- }
- }
- // Incorporate the offset, then check against cycle size
- diff -= last;
- return diff === first || ( diff % first === 0 && diff / first >= 0 );
- }
- };
- },
- "PSEUDO": function( pseudo, argument ) {
- // pseudo-class names are case-insensitive
- // http://www.w3.org/TR/selectors/#pseudo-classes
- // Prioritize by case sensitivity in case custom pseudos are added with uppercase letters
- // Remember that setFilters inherits from pseudos
- var args,
- fn = Expr.pseudos[ pseudo ] || Expr.setFilters[ pseudo.toLowerCase() ] ||
- Sizzle.error( "unsupported pseudo: " + pseudo );
- // The user may use createPseudo to indicate that
- // arguments are needed to create the filter function
- // just as Sizzle does
- if ( fn[ expando ] ) {
- return fn( argument );
- }
- // But maintain support for old signatures
- if ( fn.length > 1 ) {
- args = [ pseudo, pseudo, "", argument ];
- return Expr.setFilters.hasOwnProperty( pseudo.toLowerCase() ) ?
- markFunction(function( seed, matches ) {
- var idx,
- matched = fn( seed, argument ),
- i = matched.length;
- while ( i-- ) {
- idx = indexOf( seed, matched[i] );
- seed[ idx ] = !( matches[ idx ] = matched[i] );
- }
- }) :
- function( elem ) {
- return fn( elem, 0, args );
- };
- }
- return fn;
- }
- },
- pseudos: {
- // Potentially complex pseudos
- "not": markFunction(function( selector ) {
- // Trim the selector passed to compile
- // to avoid treating leading and trailing
- // spaces as combinators
- var input = [],
- results = [],
- matcher = compile( selector.replace( rtrim, "$1" ) );
- return matcher[ expando ] ?
- markFunction(function( seed, matches, context, xml ) {
- var elem,
- unmatched = matcher( seed, null, xml, [] ),
- i = seed.length;
- // Match elements unmatched by `matcher`
- while ( i-- ) {
- if ( (elem = unmatched[i]) ) {
- seed[i] = !(matches[i] = elem);
- }
- }
- }) :
- function( elem, context, xml ) {
- input[0] = elem;
- matcher( input, null, xml, results );
- // Don't keep the element (issue #299)
- input[0] = null;
- return !results.pop();
- };
- }),
- "has": markFunction(function( selector ) {
- return function( elem ) {
- return Sizzle( selector, elem ).length > 0;
- };
- }),
- "contains": markFunction(function( text ) {
- text = text.replace( runescape, funescape );
- return function( elem ) {
- return ( elem.textContent || getText( elem ) ).indexOf( text ) > -1;
- };
- }),
- // "Whether an element is represented by a :lang() selector
- // is based solely on the element's language value
- // being equal to the identifier C,
- // or beginning with the identifier C immediately followed by "-".
- // The matching of C against the element's language value is performed case-insensitively.
- // The identifier C does not have to be a valid language name."
- // http://www.w3.org/TR/selectors/#lang-pseudo
- "lang": markFunction( function( lang ) {
- // lang value must be a valid identifier
- if ( !ridentifier.test(lang || "") ) {
- Sizzle.error( "unsupported lang: " + lang );
- }
- lang = lang.replace( runescape, funescape ).toLowerCase();
- return function( elem ) {
- var elemLang;
- do {
- if ( (elemLang = documentIsHTML ?
- elem.lang :
- elem.getAttribute("xml:lang") || elem.getAttribute("lang")) ) {
- elemLang = elemLang.toLowerCase();
- return elemLang === lang || elemLang.indexOf( lang + "-" ) === 0;
- }
- } while ( (elem = elem.parentNode) && elem.nodeType === 1 );
- return false;
- };
- }),
- // Miscellaneous
- "target": function( elem ) {
- var hash = window.location && window.location.hash;
- return hash && hash.slice( 1 ) === elem.id;
- },
- "root": function( elem ) {
- return elem === docElem;
- },
- "focus": function( elem ) {
- return elem === document.activeElement && (!document.hasFocus || document.hasFocus()) && !!(elem.type || elem.href || ~elem.tabIndex);
- },
- // Boolean properties
- "enabled": createDisabledPseudo( false ),
- "disabled": createDisabledPseudo( true ),
- "checked": function( elem ) {
- // In CSS3, :checked should return both checked and selected elements
- // http://www.w3.org/TR/2011/REC-css3-selectors-20110929/#checked
- var nodeName = elem.nodeName.toLowerCase();
- return (nodeName === "input" && !!elem.checked) || (nodeName === "option" && !!elem.selected);
- },
- "selected": function( elem ) {
- // Accessing this property makes selected-by-default
- // options in Safari work properly
- if ( elem.parentNode ) {
- elem.parentNode.selectedIndex;
- }
- return elem.selected === true;
- },
- // Contents
- "empty": function( elem ) {
- // http://www.w3.org/TR/selectors/#empty-pseudo
- // :empty is negated by element (1) or content nodes (text: 3; cdata: 4; entity ref: 5),
- // but not by others (comment: 8; processing instruction: 7; etc.)
- // nodeType < 6 works because attributes (2) do not appear as children
- for ( elem = elem.firstChild; elem; elem = elem.nextSibling ) {
- if ( elem.nodeType < 6 ) {
- return false;
- }
- }
- return true;
- },
- "parent": function( elem ) {
- return !Expr.pseudos["empty"]( elem );
- },
- // Element/input types
- "header": function( elem ) {
- return rheader.test( elem.nodeName );
- },
- "input": function( elem ) {
- return rinputs.test( elem.nodeName );
- },
- "button": function( elem ) {
- var name = elem.nodeName.toLowerCase();
- return name === "input" && elem.type === "button" || name === "button";
- },
- "text": function( elem ) {
- var attr;
- return elem.nodeName.toLowerCase() === "input" &&
- elem.type === "text" &&
- // Support: IE<8
- // New HTML5 attribute values (e.g., "search") appear with elem.type === "text"
- ( (attr = elem.getAttribute("type")) == null || attr.toLowerCase() === "text" );
- },
- // Position-in-collection
- "first": createPositionalPseudo(function() {
- return [ 0 ];
- }),
- "last": createPositionalPseudo(function( matchIndexes, length ) {
- return [ length - 1 ];
- }),
- "eq": createPositionalPseudo(function( matchIndexes, length, argument ) {
- return [ argument < 0 ? argument + length : argument ];
- }),
- "even": createPositionalPseudo(function( matchIndexes, length ) {
- var i = 0;
- for ( ; i < length; i += 2 ) {
- matchIndexes.push( i );
- }
- return matchIndexes;
- }),
- "odd": createPositionalPseudo(function( matchIndexes, length ) {
- var i = 1;
- for ( ; i < length; i += 2 ) {
- matchIndexes.push( i );
- }
- return matchIndexes;
- }),
- "lt": createPositionalPseudo(function( matchIndexes, length, argument ) {
- var i = argument < 0 ?
- argument + length :
- argument > length ?
- length :
- argument;
- for ( ; --i >= 0; ) {
- matchIndexes.push( i );
- }
- return matchIndexes;
- }),
- "gt": createPositionalPseudo(function( matchIndexes, length, argument ) {
- var i = argument < 0 ? argument + length : argument;
- for ( ; ++i < length; ) {
- matchIndexes.push( i );
- }
- return matchIndexes;
- })
- }
-Expr.pseudos["nth"] = Expr.pseudos["eq"];
-// Add button/input type pseudos
-for ( i in { radio: true, checkbox: true, file: true, password: true, image: true } ) {
- Expr.pseudos[ i ] = createInputPseudo( i );
-for ( i in { submit: true, reset: true } ) {
- Expr.pseudos[ i ] = createButtonPseudo( i );
-// Easy API for creating new setFilters
-function setFilters() {}
-setFilters.prototype = Expr.filters = Expr.pseudos;
-Expr.setFilters = new setFilters();
-tokenize = Sizzle.tokenize = function( selector, parseOnly ) {
- var matched, match, tokens, type,
- soFar, groups, preFilters,
- cached = tokenCache[ selector + " " ];
- if ( cached ) {
- return parseOnly ? 0 : cached.slice( 0 );
- }
- soFar = selector;
- groups = [];
- preFilters = Expr.preFilter;
- while ( soFar ) {
- // Comma and first run
- if ( !matched || (match = rcomma.exec( soFar )) ) {
- if ( match ) {
- // Don't consume trailing commas as valid
- soFar = soFar.slice( match[0].length ) || soFar;
- }
- groups.push( (tokens = []) );
- }
- matched = false;
- // Combinators
- if ( (match = rcombinators.exec( soFar )) ) {
- matched = match.shift();
- tokens.push({
- value: matched,
- // Cast descendant combinators to space
- type: match[0].replace( rtrim, " " )
- });
- soFar = soFar.slice( matched.length );
- }
- // Filters
- for ( type in Expr.filter ) {
- if ( (match = matchExpr[ type ].exec( soFar )) && (!preFilters[ type ] ||
- (match = preFilters[ type ]( match ))) ) {
- matched = match.shift();
- tokens.push({
- value: matched,
- type: type,
- matches: match
- });
- soFar = soFar.slice( matched.length );
- }
- }
- if ( !matched ) {
- break;
- }
- }
- // Return the length of the invalid excess
- // if we're just parsing
- // Otherwise, throw an error or return tokens
- return parseOnly ?
- soFar.length :
- soFar ?
- Sizzle.error( selector ) :
- // Cache the tokens
- tokenCache( selector, groups ).slice( 0 );
-function toSelector( tokens ) {
- var i = 0,
- len = tokens.length,
- selector = "";
- for ( ; i < len; i++ ) {
- selector += tokens[i].value;
- }
- return selector;
-function addCombinator( matcher, combinator, base ) {
- var dir = combinator.dir,
- skip = combinator.next,
- key = skip || dir,
- checkNonElements = base && key === "parentNode",
- doneName = done++;
- return combinator.first ?
- // Check against closest ancestor/preceding element
- function( elem, context, xml ) {
- while ( (elem = elem[ dir ]) ) {
- if ( elem.nodeType === 1 || checkNonElements ) {
- return matcher( elem, context, xml );
- }
- }
- return false;
- } :
- // Check against all ancestor/preceding elements
- function( elem, context, xml ) {
- var oldCache, uniqueCache, outerCache,
- newCache = [ dirruns, doneName ];
- // We can't set arbitrary data on XML nodes, so they don't benefit from combinator caching
- if ( xml ) {
- while ( (elem = elem[ dir ]) ) {
- if ( elem.nodeType === 1 || checkNonElements ) {
- if ( matcher( elem, context, xml ) ) {
- return true;
- }
- }
- }
- } else {
- while ( (elem = elem[ dir ]) ) {
- if ( elem.nodeType === 1 || checkNonElements ) {
- outerCache = elem[ expando ] || (elem[ expando ] = {});
- // Support: IE <9 only
- // Defend against cloned attroperties (jQuery gh-1709)
- uniqueCache = outerCache[ elem.uniqueID ] || (outerCache[ elem.uniqueID ] = {});
- if ( skip && skip === elem.nodeName.toLowerCase() ) {
- elem = elem[ dir ] || elem;
- } else if ( (oldCache = uniqueCache[ key ]) &&
- oldCache[ 0 ] === dirruns && oldCache[ 1 ] === doneName ) {
- // Assign to newCache so results back-propagate to previous elements
- return (newCache[ 2 ] = oldCache[ 2 ]);
- } else {
- // Reuse newcache so results back-propagate to previous elements
- uniqueCache[ key ] = newCache;
- // A match means we're done; a fail means we have to keep checking
- if ( (newCache[ 2 ] = matcher( elem, context, xml )) ) {
- return true;
- }
- }
- }
- }
- }
- return false;
- };
-function elementMatcher( matchers ) {
- return matchers.length > 1 ?
- function( elem, context, xml ) {
- var i = matchers.length;
- while ( i-- ) {
- if ( !matchers[i]( elem, context, xml ) ) {
- return false;
- }
- }
- return true;
- } :
- matchers[0];
-function multipleContexts( selector, contexts, results ) {
- var i = 0,
- len = contexts.length;
- for ( ; i < len; i++ ) {
- Sizzle( selector, contexts[i], results );
- }
- return results;
-function condense( unmatched, map, filter, context, xml ) {
- var elem,
- newUnmatched = [],
- i = 0,
- len = unmatched.length,
- mapped = map != null;
- for ( ; i < len; i++ ) {
- if ( (elem = unmatched[i]) ) {
- if ( !filter || filter( elem, context, xml ) ) {
- newUnmatched.push( elem );
- if ( mapped ) {
- map.push( i );
- }
- }
- }
- }
- return newUnmatched;
-function setMatcher( preFilter, selector, matcher, postFilter, postFinder, postSelector ) {
- if ( postFilter && !postFilter[ expando ] ) {
- postFilter = setMatcher( postFilter );
- }
- if ( postFinder && !postFinder[ expando ] ) {
- postFinder = setMatcher( postFinder, postSelector );
- }
- return markFunction(function( seed, results, context, xml ) {
- var temp, i, elem,
- preMap = [],
- postMap = [],
- preexisting = results.length,
- // Get initial elements from seed or context
- elems = seed || multipleContexts( selector || "*", context.nodeType ? [ context ] : context, [] ),
- // Prefilter to get matcher input, preserving a map for seed-results synchronization
- matcherIn = preFilter && ( seed || !selector ) ?
- condense( elems, preMap, preFilter, context, xml ) :
- elems,
- matcherOut = matcher ?
- // If we have a postFinder, or filtered seed, or non-seed postFilter or preexisting results,
- postFinder || ( seed ? preFilter : preexisting || postFilter ) ?
- // ...intermediate processing is necessary
- [] :
- // ...otherwise use results directly
- results :
- matcherIn;
- // Find primary matches
- if ( matcher ) {
- matcher( matcherIn, matcherOut, context, xml );
- }
- // Apply postFilter
- if ( postFilter ) {
- temp = condense( matcherOut, postMap );
- postFilter( temp, [], context, xml );
- // Un-match failing elements by moving them back to matcherIn
- i = temp.length;
- while ( i-- ) {
- if ( (elem = temp[i]) ) {
- matcherOut[ postMap[i] ] = !(matcherIn[ postMap[i] ] = elem);
- }
- }
- }
- if ( seed ) {
- if ( postFinder || preFilter ) {
- if ( postFinder ) {
- // Get the final matcherOut by condensing this intermediate into postFinder contexts
- temp = [];
- i = matcherOut.length;
- while ( i-- ) {
- if ( (elem = matcherOut[i]) ) {
- // Restore matcherIn since elem is not yet a final match
- temp.push( (matcherIn[i] = elem) );
- }
- }
- postFinder( null, (matcherOut = []), temp, xml );
- }
- // Move matched elements from seed to results to keep them synchronized
- i = matcherOut.length;
- while ( i-- ) {
- if ( (elem = matcherOut[i]) &&
- (temp = postFinder ? indexOf( seed, elem ) : preMap[i]) > -1 ) {
- seed[temp] = !(results[temp] = elem);
- }
- }
- }
- // Add elements to results, through postFinder if defined
- } else {
- matcherOut = condense(
- matcherOut === results ?
- matcherOut.splice( preexisting, matcherOut.length ) :
- matcherOut
- );
- if ( postFinder ) {
- postFinder( null, results, matcherOut, xml );
- } else {
- push.apply( results, matcherOut );
- }
- }
- });
-function matcherFromTokens( tokens ) {
- var checkContext, matcher, j,
- len = tokens.length,
- leadingRelative = Expr.relative[ tokens[0].type ],
- implicitRelative = leadingRelative || Expr.relative[" "],
- i = leadingRelative ? 1 : 0,
- // The foundational matcher ensures that elements are reachable from top-level context(s)
- matchContext = addCombinator( function( elem ) {
- return elem === checkContext;
- }, implicitRelative, true ),
- matchAnyContext = addCombinator( function( elem ) {
- return indexOf( checkContext, elem ) > -1;
- }, implicitRelative, true ),
- matchers = [ function( elem, context, xml ) {
- var ret = ( !leadingRelative && ( xml || context !== outermostContext ) ) || (
- (checkContext = context).nodeType ?
- matchContext( elem, context, xml ) :
- matchAnyContext( elem, context, xml ) );
- // Avoid hanging onto element (issue #299)
- checkContext = null;
- return ret;
- } ];
- for ( ; i < len; i++ ) {
- if ( (matcher = Expr.relative[ tokens[i].type ]) ) {
- matchers = [ addCombinator(elementMatcher( matchers ), matcher) ];
- } else {
- matcher = Expr.filter[ tokens[i].type ].apply( null, tokens[i].matches );
- // Return special upon seeing a positional matcher
- if ( matcher[ expando ] ) {
- // Find the next relative operator (if any) for proper handling
- j = ++i;
- for ( ; j < len; j++ ) {
- if ( Expr.relative[ tokens[j].type ] ) {
- break;
- }
- }
- return setMatcher(
- i > 1 && elementMatcher( matchers ),
- i > 1 && toSelector(
- // If the preceding token was a descendant combinator, insert an implicit any-element `*`
- tokens.slice( 0, i - 1 ).concat({ value: tokens[ i - 2 ].type === " " ? "*" : "" })
- ).replace( rtrim, "$1" ),
- matcher,
- i < j && matcherFromTokens( tokens.slice( i, j ) ),
- j < len && matcherFromTokens( (tokens = tokens.slice( j )) ),
- j < len && toSelector( tokens )
- );
- }
- matchers.push( matcher );
- }
- }
- return elementMatcher( matchers );
-function matcherFromGroupMatchers( elementMatchers, setMatchers ) {
- var bySet = setMatchers.length > 0,
- byElement = elementMatchers.length > 0,
- superMatcher = function( seed, context, xml, results, outermost ) {
- var elem, j, matcher,
- matchedCount = 0,
- i = "0",
- unmatched = seed && [],
- setMatched = [],
- contextBackup = outermostContext,
- // We must always have either seed elements or outermost context
- elems = seed || byElement && Expr.find["TAG"]( "*", outermost ),
- // Use integer dirruns iff this is the outermost matcher
- dirrunsUnique = (dirruns += contextBackup == null ? 1 : Math.random() || 0.1),
- len = elems.length;
- if ( outermost ) {
- outermostContext = context === document || context || outermost;
- }
- // Add elements passing elementMatchers directly to results
- // Support: IE<9, Safari
- // Tolerate NodeList properties (IE: "length"; Safari: ) matching elements by id
- for ( ; i !== len && (elem = elems[i]) != null; i++ ) {
- if ( byElement && elem ) {
- j = 0;
- if ( !context && elem.ownerDocument !== document ) {
- setDocument( elem );
- xml = !documentIsHTML;
- }
- while ( (matcher = elementMatchers[j++]) ) {
- if ( matcher( elem, context || document, xml) ) {
- results.push( elem );
- break;
- }
- }
- if ( outermost ) {
- dirruns = dirrunsUnique;
- }
- }
- // Track unmatched elements for set filters
- if ( bySet ) {
- // They will have gone through all possible matchers
- if ( (elem = !matcher && elem) ) {
- matchedCount--;
- }
- // Lengthen the array for every element, matched or not
- if ( seed ) {
- unmatched.push( elem );
- }
- }
- }
- // `i` is now the count of elements visited above, and adding it to `matchedCount`
- // makes the latter nonnegative.
- matchedCount += i;
- // Apply set filters to unmatched elements
- // NOTE: This can be skipped if there are no unmatched elements (i.e., `matchedCount`
- // equals `i`), unless we didn't visit _any_ elements in the above loop because we have
- // no element matchers and no seed.
- // Incrementing an initially-string "0" `i` allows `i` to remain a string only in that
- // case, which will result in a "00" `matchedCount` that differs from `i` but is also
- // numerically zero.
- if ( bySet && i !== matchedCount ) {
- j = 0;
- while ( (matcher = setMatchers[j++]) ) {
- matcher( unmatched, setMatched, context, xml );
- }
- if ( seed ) {
- // Reintegrate element matches to eliminate the need for sorting
- if ( matchedCount > 0 ) {
- while ( i-- ) {
- if ( !(unmatched[i] || setMatched[i]) ) {
- setMatched[i] = pop.call( results );
- }
- }
- }
- // Discard index placeholder values to get only actual matches
- setMatched = condense( setMatched );
- }
- // Add matches to results
- push.apply( results, setMatched );
- // Seedless set matches succeeding multiple successful matchers stipulate sorting
- if ( outermost && !seed && setMatched.length > 0 &&
- ( matchedCount + setMatchers.length ) > 1 ) {
- Sizzle.uniqueSort( results );
- }
- }
- // Override manipulation of globals by nested matchers
- if ( outermost ) {
- dirruns = dirrunsUnique;
- outermostContext = contextBackup;
- }
- return unmatched;
- };
- return bySet ?
- markFunction( superMatcher ) :
- superMatcher;
-compile = Sizzle.compile = function( selector, match /* Internal Use Only */ ) {
- var i,
- setMatchers = [],
- elementMatchers = [],
- cached = compilerCache[ selector + " " ];
- if ( !cached ) {
- // Generate a function of recursive functions that can be used to check each element
- if ( !match ) {
- match = tokenize( selector );
- }
- i = match.length;
- while ( i-- ) {
- cached = matcherFromTokens( match[i] );
- if ( cached[ expando ] ) {
- setMatchers.push( cached );
- } else {
- elementMatchers.push( cached );
- }
- }
- // Cache the compiled function
- cached = compilerCache( selector, matcherFromGroupMatchers( elementMatchers, setMatchers ) );
- // Save selector and tokenization
- cached.selector = selector;
- }
- return cached;
- * A low-level selection function that works with Sizzle's compiled
- * selector functions
- * @param {String|Function} selector A selector or a pre-compiled
- * selector function built with Sizzle.compile
- * @param {Element} context
- * @param {Array} [results]
- * @param {Array} [seed] A set of elements to match against
- */
-select = Sizzle.select = function( selector, context, results, seed ) {
- var i, tokens, token, type, find,
- compiled = typeof selector === "function" && selector,
- match = !seed && tokenize( (selector = compiled.selector || selector) );
- results = results || [];
- // Try to minimize operations if there is only one selector in the list and no seed
- // (the latter of which guarantees us context)
- if ( match.length === 1 ) {
- // Reduce context if the leading compound selector is an ID
- tokens = match[0] = match[0].slice( 0 );
- if ( tokens.length > 2 && (token = tokens[0]).type === "ID" &&
- context.nodeType === 9 && documentIsHTML && Expr.relative[ tokens[1].type ] ) {
- context = ( Expr.find["ID"]( token.matches[0].replace(runescape, funescape), context ) || [] )[0];
- if ( !context ) {
- return results;
- // Precompiled matchers will still verify ancestry, so step up a level
- } else if ( compiled ) {
- context = context.parentNode;
- }
- selector = selector.slice( tokens.shift().value.length );
- }
- // Fetch a seed set for right-to-left matching
- i = matchExpr["needsContext"].test( selector ) ? 0 : tokens.length;
- while ( i-- ) {
- token = tokens[i];
- // Abort if we hit a combinator
- if ( Expr.relative[ (type = token.type) ] ) {
- break;
- }
- if ( (find = Expr.find[ type ]) ) {
- // Search, expanding context for leading sibling combinators
- if ( (seed = find(
- token.matches[0].replace( runescape, funescape ),
- rsibling.test( tokens[0].type ) && testContext( context.parentNode ) || context
- )) ) {
- // If seed is empty or no tokens remain, we can return early
- tokens.splice( i, 1 );
- selector = seed.length && toSelector( tokens );
- if ( !selector ) {
- push.apply( results, seed );
- return results;
- }
- break;
- }
- }
- }
- }
- // Compile and execute a filtering function if one is not provided
- // Provide `match` to avoid retokenization if we modified the selector above
- ( compiled || compile( selector, match ) )(
- seed,
- context,
- !documentIsHTML,
- results,
- !context || rsibling.test( selector ) && testContext( context.parentNode ) || context
- );
- return results;
-// One-time assignments
-// Sort stability
-support.sortStable = expando.split("").sort( sortOrder ).join("") === expando;
-// Support: Chrome 14-35+
-// Always assume duplicates if they aren't passed to the comparison function
-support.detectDuplicates = !!hasDuplicate;
-// Initialize against the default document
-// Support: Webkit<537.32 - Safari 6.0.3/Chrome 25 (fixed in Chrome 27)
-// Detached nodes confoundingly follow *each other*
-support.sortDetached = assert(function( el ) {
- // Should return 1, but returns 4 (following)
- return el.compareDocumentPosition( document.createElement("fieldset") ) & 1;
-// Support: IE<8
-// Prevent attribute/property "interpolation"
-// https://msdn.microsoft.com/en-us/library/ms536429%28VS.85%29.aspx
-if ( !assert(function( el ) {
- el.innerHTML = " ";
- return el.firstChild.getAttribute("href") === "#" ;
-}) ) {
- addHandle( "type|href|height|width", function( elem, name, isXML ) {
- if ( !isXML ) {
- return elem.getAttribute( name, name.toLowerCase() === "type" ? 1 : 2 );
- }
- });
-// Support: IE<9
-// Use defaultValue in place of getAttribute("value")
-if ( !support.attributes || !assert(function( el ) {
- el.innerHTML = " ";
- el.firstChild.setAttribute( "value", "" );
- return el.firstChild.getAttribute( "value" ) === "";
-}) ) {
- addHandle( "value", function( elem, name, isXML ) {
- if ( !isXML && elem.nodeName.toLowerCase() === "input" ) {
- return elem.defaultValue;
- }
- });
-// Support: IE<9
-// Use getAttributeNode to fetch booleans when getAttribute lies
-if ( !assert(function( el ) {
- return el.getAttribute("disabled") == null;
-}) ) {
- addHandle( booleans, function( elem, name, isXML ) {
- var val;
- if ( !isXML ) {
- return elem[ name ] === true ? name.toLowerCase() :
- (val = elem.getAttributeNode( name )) && val.specified ?
- val.value :
- null;
- }
- });
-return Sizzle;
-})( window );
-jQuery.find = Sizzle;
-jQuery.expr = Sizzle.selectors;
-// Deprecated
-jQuery.expr[ ":" ] = jQuery.expr.pseudos;
-jQuery.uniqueSort = jQuery.unique = Sizzle.uniqueSort;
-jQuery.text = Sizzle.getText;
-jQuery.isXMLDoc = Sizzle.isXML;
-jQuery.contains = Sizzle.contains;
-jQuery.escapeSelector = Sizzle.escape;
-var dir = function( elem, dir, until ) {
- var matched = [],
- truncate = until !== undefined;
- while ( ( elem = elem[ dir ] ) && elem.nodeType !== 9 ) {
- if ( elem.nodeType === 1 ) {
- if ( truncate && jQuery( elem ).is( until ) ) {
- break;
- }
- matched.push( elem );
- }
- }
- return matched;
-var siblings = function( n, elem ) {
- var matched = [];
- for ( ; n; n = n.nextSibling ) {
- if ( n.nodeType === 1 && n !== elem ) {
- matched.push( n );
- }
- }
- return matched;
-var rneedsContext = jQuery.expr.match.needsContext;
-function nodeName( elem, name ) {
- return elem.nodeName && elem.nodeName.toLowerCase() === name.toLowerCase();
-var rsingleTag = ( /^<([a-z][^\/\0>:\x20\t\r\n\f]*)[\x20\t\r\n\f]*\/?>(?:<\/\1>|)$/i );
-// Implement the identical functionality for filter and not
-function winnow( elements, qualifier, not ) {
- if ( isFunction( qualifier ) ) {
- return jQuery.grep( elements, function( elem, i ) {
- return !!qualifier.call( elem, i, elem ) !== not;
- } );
- }
- // Single element
- if ( qualifier.nodeType ) {
- return jQuery.grep( elements, function( elem ) {
- return ( elem === qualifier ) !== not;
- } );
- }
- // Arraylike of elements (jQuery, arguments, Array)
- if ( typeof qualifier !== "string" ) {
- return jQuery.grep( elements, function( elem ) {
- return ( indexOf.call( qualifier, elem ) > -1 ) !== not;
- } );
- }
- // Filtered directly for both simple and complex selectors
- return jQuery.filter( qualifier, elements, not );
-jQuery.filter = function( expr, elems, not ) {
- var elem = elems[ 0 ];
- if ( not ) {
- expr = ":not(" + expr + ")";
- }
- if ( elems.length === 1 && elem.nodeType === 1 ) {
- return jQuery.find.matchesSelector( elem, expr ) ? [ elem ] : [];
- }
- return jQuery.find.matches( expr, jQuery.grep( elems, function( elem ) {
- return elem.nodeType === 1;
- } ) );
-jQuery.fn.extend( {
- find: function( selector ) {
- var i, ret,
- len = this.length,
- self = this;
- if ( typeof selector !== "string" ) {
- return this.pushStack( jQuery( selector ).filter( function() {
- for ( i = 0; i < len; i++ ) {
- if ( jQuery.contains( self[ i ], this ) ) {
- return true;
- }
- }
- } ) );
- }
- ret = this.pushStack( [] );
- for ( i = 0; i < len; i++ ) {
- jQuery.find( selector, self[ i ], ret );
- }
- return len > 1 ? jQuery.uniqueSort( ret ) : ret;
- },
- filter: function( selector ) {
- return this.pushStack( winnow( this, selector || [], false ) );
- },
- not: function( selector ) {
- return this.pushStack( winnow( this, selector || [], true ) );
- },
- is: function( selector ) {
- return !!winnow(
- this,
- // If this is a positional/relative selector, check membership in the returned set
- // so $("p:first").is("p:last") won't return true for a doc with two "p".
- typeof selector === "string" && rneedsContext.test( selector ) ?
- jQuery( selector ) :
- selector || [],
- false
- ).length;
- }
-} );
-// Initialize a jQuery object
-// A central reference to the root jQuery(document)
-var rootjQuery,
- // A simple way to check for HTML strings
- // Prioritize #id over to avoid XSS via location.hash (#9521)
- // Strict HTML recognition (#11290: must start with <)
- // Shortcut simple #id case for speed
- rquickExpr = /^(?:\s*(<[\w\W]+>)[^>]*|#([\w-]+))$/,
- init = jQuery.fn.init = function( selector, context, root ) {
- var match, elem;
- // HANDLE: $(""), $(null), $(undefined), $(false)
- if ( !selector ) {
- return this;
- }
- // Method init() accepts an alternate rootjQuery
- // so migrate can support jQuery.sub (gh-2101)
- root = root || rootjQuery;
- // Handle HTML strings
- if ( typeof selector === "string" ) {
- if ( selector[ 0 ] === "<" &&
- selector[ selector.length - 1 ] === ">" &&
- selector.length >= 3 ) {
- // Assume that strings that start and end with <> are HTML and skip the regex check
- match = [ null, selector, null ];
- } else {
- match = rquickExpr.exec( selector );
- }
- // Match html or make sure no context is specified for #id
- if ( match && ( match[ 1 ] || !context ) ) {
- // HANDLE: $(html) -> $(array)
- if ( match[ 1 ] ) {
- context = context instanceof jQuery ? context[ 0 ] : context;
- // Option to run scripts is true for back-compat
- // Intentionally let the error be thrown if parseHTML is not present
- jQuery.merge( this, jQuery.parseHTML(
- match[ 1 ],
- context && context.nodeType ? context.ownerDocument || context : document,
- true
- ) );
- // HANDLE: $(html, props)
- if ( rsingleTag.test( match[ 1 ] ) && jQuery.isPlainObject( context ) ) {
- for ( match in context ) {
- // Properties of context are called as methods if possible
- if ( isFunction( this[ match ] ) ) {
- this[ match ]( context[ match ] );
- // ...and otherwise set as attributes
- } else {
- this.attr( match, context[ match ] );
- }
- }
- }
- return this;
- // HANDLE: $(#id)
- } else {
- elem = document.getElementById( match[ 2 ] );
- if ( elem ) {
- // Inject the element directly into the jQuery object
- this[ 0 ] = elem;
- this.length = 1;
- }
- return this;
- }
- // HANDLE: $(expr, $(...))
- } else if ( !context || context.jquery ) {
- return ( context || root ).find( selector );
- // HANDLE: $(expr, context)
- // (which is just equivalent to: $(context).find(expr)
- } else {
- return this.constructor( context ).find( selector );
- }
- // HANDLE: $(DOMElement)
- } else if ( selector.nodeType ) {
- this[ 0 ] = selector;
- this.length = 1;
- return this;
- // HANDLE: $(function)
- // Shortcut for document ready
- } else if ( isFunction( selector ) ) {
- return root.ready !== undefined ?
- root.ready( selector ) :
- // Execute immediately if ready is not present
- selector( jQuery );
- }
- return jQuery.makeArray( selector, this );
- };
-// Give the init function the jQuery prototype for later instantiation
-init.prototype = jQuery.fn;
-// Initialize central reference
-rootjQuery = jQuery( document );
-var rparentsprev = /^(?:parents|prev(?:Until|All))/,
- // Methods guaranteed to produce a unique set when starting from a unique set
- guaranteedUnique = {
- children: true,
- contents: true,
- next: true,
- prev: true
- };
-jQuery.fn.extend( {
- has: function( target ) {
- var targets = jQuery( target, this ),
- l = targets.length;
- return this.filter( function() {
- var i = 0;
- for ( ; i < l; i++ ) {
- if ( jQuery.contains( this, targets[ i ] ) ) {
- return true;
- }
- }
- } );
- },
- closest: function( selectors, context ) {
- var cur,
- i = 0,
- l = this.length,
- matched = [],
- targets = typeof selectors !== "string" && jQuery( selectors );
- // Positional selectors never match, since there's no _selection_ context
- if ( !rneedsContext.test( selectors ) ) {
- for ( ; i < l; i++ ) {
- for ( cur = this[ i ]; cur && cur !== context; cur = cur.parentNode ) {
- // Always skip document fragments
- if ( cur.nodeType < 11 && ( targets ?
- targets.index( cur ) > -1 :
- // Don't pass non-elements to Sizzle
- cur.nodeType === 1 &&
- jQuery.find.matchesSelector( cur, selectors ) ) ) {
- matched.push( cur );
- break;
- }
- }
- }
- }
- return this.pushStack( matched.length > 1 ? jQuery.uniqueSort( matched ) : matched );
- },
- // Determine the position of an element within the set
- index: function( elem ) {
- // No argument, return index in parent
- if ( !elem ) {
- return ( this[ 0 ] && this[ 0 ].parentNode ) ? this.first().prevAll().length : -1;
- }
- // Index in selector
- if ( typeof elem === "string" ) {
- return indexOf.call( jQuery( elem ), this[ 0 ] );
- }
- // Locate the position of the desired element
- return indexOf.call( this,
- // If it receives a jQuery object, the first element is used
- elem.jquery ? elem[ 0 ] : elem
- );
- },
- add: function( selector, context ) {
- return this.pushStack(
- jQuery.uniqueSort(
- jQuery.merge( this.get(), jQuery( selector, context ) )
- )
- );
- },
- addBack: function( selector ) {
- return this.add( selector == null ?
- this.prevObject : this.prevObject.filter( selector )
- );
- }
-} );
-function sibling( cur, dir ) {
- while ( ( cur = cur[ dir ] ) && cur.nodeType !== 1 ) {}
- return cur;
-jQuery.each( {
- parent: function( elem ) {
- var parent = elem.parentNode;
- return parent && parent.nodeType !== 11 ? parent : null;
- },
- parents: function( elem ) {
- return dir( elem, "parentNode" );
- },
- parentsUntil: function( elem, i, until ) {
- return dir( elem, "parentNode", until );
- },
- next: function( elem ) {
- return sibling( elem, "nextSibling" );
- },
- prev: function( elem ) {
- return sibling( elem, "previousSibling" );
- },
- nextAll: function( elem ) {
- return dir( elem, "nextSibling" );
- },
- prevAll: function( elem ) {
- return dir( elem, "previousSibling" );
- },
- nextUntil: function( elem, i, until ) {
- return dir( elem, "nextSibling", until );
- },
- prevUntil: function( elem, i, until ) {
- return dir( elem, "previousSibling", until );
- },
- siblings: function( elem ) {
- return siblings( ( elem.parentNode || {} ).firstChild, elem );
- },
- children: function( elem ) {
- return siblings( elem.firstChild );
- },
- contents: function( elem ) {
- if ( typeof elem.contentDocument !== "undefined" ) {
- return elem.contentDocument;
- }
- // Support: IE 9 - 11 only, iOS 7 only, Android Browser <=4.3 only
- // Treat the template element as a regular one in browsers that
- // don't support it.
- if ( nodeName( elem, "template" ) ) {
- elem = elem.content || elem;
- }
- return jQuery.merge( [], elem.childNodes );
- }
-}, function( name, fn ) {
- jQuery.fn[ name ] = function( until, selector ) {
- var matched = jQuery.map( this, fn, until );
- if ( name.slice( -5 ) !== "Until" ) {
- selector = until;
- }
- if ( selector && typeof selector === "string" ) {
- matched = jQuery.filter( selector, matched );
- }
- if ( this.length > 1 ) {
- // Remove duplicates
- if ( !guaranteedUnique[ name ] ) {
- jQuery.uniqueSort( matched );
- }
- // Reverse order for parents* and prev-derivatives
- if ( rparentsprev.test( name ) ) {
- matched.reverse();
- }
- }
- return this.pushStack( matched );
- };
-} );
-var rnothtmlwhite = ( /[^\x20\t\r\n\f]+/g );
-// Convert String-formatted options into Object-formatted ones
-function createOptions( options ) {
- var object = {};
- jQuery.each( options.match( rnothtmlwhite ) || [], function( _, flag ) {
- object[ flag ] = true;
- } );
- return object;
- * Create a callback list using the following parameters:
- *
- * options: an optional list of space-separated options that will change how
- * the callback list behaves or a more traditional option object
- *
- * By default a callback list will act like an event callback list and can be
- * "fired" multiple times.
- *
- * Possible options:
- *
- * once: will ensure the callback list can only be fired once (like a Deferred)
diff --git a/src/test/java/org/grobid/core/data/material/FormulaTest.java b/src/test/java/org/grobid/core/data/material/FormulaTest.java
index c6776e56..b73ad804 100644
--- a/src/test/java/org/grobid/core/data/material/FormulaTest.java
+++ b/src/test/java/org/grobid/core/data/material/FormulaTest.java
@@ -1,29 +1,28 @@
package org.grobid.core.data.material;
+import org.junit.jupiter.api.Assertions;
import org.junit.jupiter.api.Test;
import java.util.Map;
-import static org.assertj.core.api.Assertions.assertThat;
class FormulaTest {
void testEquals_onlyRawValue_shouldReturnTrue() {
Formula formula1 = new Formula("La 3 A 1 R 2");
Formula formula2 = new Formula("La 3 A 1 R 2");
- assertThat(formula1.equals(formula2));
+ Assertions.assertEquals(formula1, formula2);
void testEquals_onlyRawValue_shouldReturnFalse() {
Formula formula1 = new Formula("La 3 A 1 R 2");
Formula formula2 = new Formula("La 3 A 2 R 2");
- assertThat(formula1.equals(formula2));
+ Assertions.assertEquals(formula1, formula2);
@@ -33,7 +32,7 @@ void testEquals_onlyComposition_shouldReturnTrue() {
Formula formula2 = new Formula();
formula2.setFormulaComposition(Map.of("Fe", "3", "La", "2"));
- assertThat(formula1.equals(formula2));
+ Assertions.assertEquals(formula1, formula2);
@@ -44,7 +43,7 @@ void testEquals_onlyComposition_shouldReturnFalse() {
Formula formula2 = new Formula();
formula2.setFormulaComposition(Map.of("La", "3", "Fe", "3"));
- assertThat(formula1.equals(formula2));
+ Assertions.assertNotEquals(formula1, formula2);
\ No newline at end of file
diff --git a/src/test/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatterTest.java b/src/test/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatterTest.java
index 858e2d3c..168a636a 100644
--- a/src/test/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatterTest.java
+++ b/src/test/java/org/grobid/core/engines/training/SuperconductorsTrainingXMLFormatterTest.java
@@ -6,15 +6,18 @@
import org.grobid.core.data.document.DocumentBlock;
import org.grobid.core.data.document.Span;
import org.grobid.core.layout.LayoutToken;
+import org.grobid.core.utilities.AdditionalLayoutTokensUtil;
+import org.grobid.core.utilities.OffsetPosition;
import org.junit.Before;
import org.junit.Test;
import java.util.ArrayList;
+import java.util.Arrays;
import java.util.List;
+import static org.grobid.core.document.xml.XmlBuilderUtils.teiElement;
import static org.grobid.core.engines.label.SuperconductorsTaggingLabels.*;
-import static org.hamcrest.CoreMatchers.endsWith;
-import static org.hamcrest.CoreMatchers.is;
+import static org.hamcrest.CoreMatchers.*;
import static org.hamcrest.MatcherAssert.assertThat;
public class SuperconductorsTrainingXMLFormatterTest {
@@ -123,14 +126,18 @@ public void testDocumentConstruction_doubleKeywords_shouldThrowException() {
public void testDocumentConstruction() {
List spanListTitle = new ArrayList<>();
- span1.setOffsetStart(19);
- span1.setOffsetEnd(30);
- spanListTitle.add(span1);
+ Span anotherSpan = new Span("(TMTSF)2PF6", SUPERCONDUCTORS_MATERIAL_LABEL);
+ anotherSpan.setOffsetStart(19);
+ anotherSpan.setOffsetEnd(30);
+ spanListTitle.add(anotherSpan);
String textTitle = "The Bechgaard salt (TMTSF)2PF6 (TMTSF = tetra- methyltetraselenafulvalene) was";
List layoutTokensTitle = DeepAnalyzer.getInstance().tokenizeWithLayoutToken(textTitle);
+ Pair indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensTitle, 19, 30);
+ anotherSpan.setLayoutTokens(layoutTokensTitle.subList(indexes.getLeft(), indexes.getRight()));
List blocks = new ArrayList<>();
DocumentBlock documentBlockTitle = new DocumentBlock(layoutTokensTitle, DocumentBlock.SECTION_HEADER, DocumentBlock.SUB_SECTION_TITLE, spanListTitle, new ArrayList<>());
@@ -153,66 +160,121 @@ public void testDocumentConstruction() {
List spanListParagraph = new ArrayList<>();
- Span Span = new Span();
- Span.setOffsetStart(445);
- Span.setOffsetEnd(458);
- Span.setText("FeSe 1-x Te x");
- spanListParagraph.add(Span);
- Span Span2 = new Span();
- Span2.setOffsetStart(460);
- Span2.setOffsetEnd(471);
- Span2.setText("0.6 ≤ x ≤ 1");
- spanListParagraph.add(Span2);
- Span Span3 = new Span();
- Span3.setOffsetStart(549);
- Span3.setOffsetEnd(561);
- Span3.setText("x = 0.6 -0.9");
- spanListParagraph.add(Span3);
- Span Span4 = new Span();
- Span4.setOffsetStart(562);
- Span4.setOffsetEnd(569);
- Span4.setText("exhibit");
- spanListParagraph.add(Span4);
- Span Span5 = new Span();
- Span5.setOffsetStart(570);
- Span5.setOffsetEnd(592);
- Span5.setText("bulk superconductivity");
- spanListParagraph.add(Span5);
+ Span span1 = new Span();
+ span1.setOffsetStart(445);
+ span1.setOffsetEnd(458);
+ span1.setText("FeSe 1-x Te x");
+ spanListParagraph.add(span1);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 445, 458);
+ span1.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
- Span Span6 = new Span();
- Span6.setOffsetStart(632);
- Span6.setOffsetEnd(647);
- Span6.setText("superconducting");
- spanListParagraph.add(Span6);
- Span Span7 = new Span();
- Span7.setOffsetStart(653);
- Span7.setOffsetEnd(675);
- Span7.setText("transition temperature");
- spanListParagraph.add(Span7);
+ Span span2 = new Span();
+ span2.setOffsetStart(460);
+ span2.setOffsetEnd(471);
+ span2.setText("0.6 ≤ x ≤ 1");
+ spanListParagraph.add(span2);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 460, 471);
+ span2.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
+ Span span3 = new Span();
+ span3.setOffsetStart(549);
+ span3.setOffsetEnd(561);
+ span3.setText("x = 0.6 -0.9");
+ spanListParagraph.add(span3);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 549, 561);
+ span3.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
+ Span span4 = new Span();
+ span4.setOffsetStart(562);
+ span4.setOffsetEnd(569);
+ span4.setText("exhibit");
+ spanListParagraph.add(span4);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 562, 569);
+ span4.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
+ Span span5 = new Span();
+ span5.setOffsetStart(570);
+ span5.setOffsetEnd(592);
+ span5.setText("bulk superconductivity");
+ spanListParagraph.add(span5);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 570, 592);
+ span5.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
+ Span span6 = new Span();
+ span6.setOffsetStart(632);
+ span6.setOffsetEnd(647);
+ span6.setText("superconducting");
+ spanListParagraph.add(span6);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 632, 647);
+ span6.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
+ Span span7 = new Span();
+ span7.setOffsetStart(653);
+ span7.setOffsetEnd(675);
+ span7.setText("transition temperature");
+ spanListParagraph.add(span7);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokensParagraph, 653, 675);
+ span7.setLayoutTokens(layoutTokensParagraph.subList(indexes.getLeft(), indexes.getRight()));
DocumentBlock blockParagraph = new DocumentBlock(layoutTokensParagraph, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_PARAGRAPH, spanListParagraph, new ArrayList<>());
// figure caption
- blocks.add(new DocumentBlock(layoutTokensParagraph, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_FIGURE, spanListParagraph, new ArrayList<>()));
+ blocks.add(new DocumentBlock(layoutTokensParagraph, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_FIGURE, "1", spanListParagraph, new ArrayList<>()));
- blocks.add(new DocumentBlock(layoutTokensParagraph, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_TABLE, spanListParagraph, new ArrayList<>()));
+ blocks.add(new DocumentBlock(layoutTokensParagraph, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_TABLE, "2", spanListParagraph, new ArrayList<>()));
target.format(blocks, 1234);
+ @Test
+ public void testGetParent_previousParentNotNull_sameParagraphId_shouldreturnPreviousParent() throws Exception {
+ Element body = teiElement("body");
+ Element previousParent = teiElement("p");
+ Element parent = target.getParentElement(body, "1234", "1234", previousParent, "ab", null);
+ assertThat(parent, is(previousParent));
+ }
+ @Test
+ public void testGetParent_previousParentNotNull_differentParagraphId_shouldreturnNewElement() throws Exception {
+ Element body = teiElement("body");
+ Element previousParent = teiElement("p");
+ Element parent = target.getParentElement(body, "1234", "12345", previousParent, "ab", null);
+ assertThat(parent, is(not(previousParent)));
+ }
+ @Test
+ public void testGetParent_previousParentNull_differentParagraphId_shouldreturnNewElement() throws Exception {
+ Element body = teiElement("body");
+ Element previousParent = null;
+ Element parent = target.getParentElement(body, "1234", "12345", previousParent, "ab", null);
+ assertThat(parent, is(not(previousParent)));
+ assertThat(parent.getLocalName(), is("ab"));
+ assertThat(parent.getAttributeCount(), is(0));
+ }
+ @Test
+ public void testGetParent_previousParentNull_sameParagraphId_shouldreturnNewElement() throws Exception {
+ Element body = teiElement("body");
+ Element previousParent = null;
+ Element parent = target.getParentElement(body, "1234", "1234", previousParent, "ab", null);
+ assertThat(parent, is(not(previousParent)));
+ assertThat(parent.getLocalName(), is("ab"));
+ assertThat(parent.getAttributeCount(), is(0));
+ }
public void testTrainingData_value() throws Exception {
List spanList = new ArrayList<>();
@@ -223,10 +285,13 @@ public void testTrainingData_value() throws Exception {
String text = "The Bechgaard salt (TMTSF)2PF6 (TMTSF = tetra- methyltetraselenafulvalene) was";
+ List tokens = DeepAnalyzer.getInstance().tokenizeWithLayoutToken(text);
+ span1.setLayoutTokens(tokens.subList(6, 13));
- Element out = target.trainingExtraction(spanList, DeepAnalyzer.getInstance().tokenizeWithLayoutToken(text));
+ Element out = target.trainingExtraction(spanList, tokens);
assertThat(out.toXML(), is("The Bechgaard salt (TMTSF)2PF6 (TMTSF = tetra- methyltetraselenafulvalene) was
@@ -247,12 +312,14 @@ public void testTrainingDataExtraction_withDefaultAndCustomTags() throws Excepti
superconductor.setText("FeSe 1-x Te x");
+ superconductor.setLayoutTokens(layoutTokens.subList(18, 27));
Span superconductor2 = new Span();
superconductor2.setText("0.6 ≤ x ≤ 1");
+ superconductor2.setLayoutTokens(layoutTokens.subList(29, 40));
@@ -290,18 +357,20 @@ public void testTrainingDataExtraction_textBody() throws Exception {
span1.setText("FeSe 1-x Te x");
+ span1.setLayoutTokens(layoutTokens.subList(18, 27));
Span span2 = new Span();
span2.setText("0.6 ≤ x ≤ 1");
+ span2.setLayoutTokens(layoutTokens.subList(29, 40));
List documentBlocks = new ArrayList<>();
- documentBlocks.add(new DocumentBlock(layoutTokens, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_PARAGRAPH, spanList, new ArrayList<>()));
+ documentBlocks.add(new DocumentBlock(layoutTokens, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_PARAGRAPH, "1", spanList, new ArrayList<>()));
//This will ensure that next time I modify the principle on which the offsets are calculated, will fail
int startingOffset = layoutTokens.get(0).getOffset();
@@ -311,7 +380,7 @@ public void testTrainingDataExtraction_textBody() throws Exception {
String output = target.format(documentBlocks, 1);
- endsWith("Specific-Heat Study of Superconducting and Normal States in FeSe 1-x Te x (0.6 ≤ x ≤ 1 ) Single Crystals: Strong-Coupling Superconductivity, Strong Electron-Correlation, and Inhomogeneity
+ endsWith("Specific-Heat Study of Superconducting and Normal States in FeSe 1-x Te x (0.6 ≤ x ≤ 1 ) Single Crystals: Strong-Coupling Superconductivity, Strong Electron-Correlation, and Inhomogeneity
@@ -326,57 +395,73 @@ public void textTrainingDataExtraction_textBody_withOffsets() throws Exception {
List spanList = new ArrayList<>();
- Span Span = new Span();
- Span.setOffsetStart(445);
- Span.setOffsetEnd(458);
- Span.setText("FeSe 1-x Te x");
- spanList.add(Span);
- Span Span2 = new Span();
- Span2.setOffsetStart(460);
- Span2.setOffsetEnd(471);
- Span2.setText("0.6 ≤ x ≤ 1");
- spanList.add(Span2);
- Span Span3 = new Span();
- Span3.setOffsetStart(549);
- Span3.setOffsetEnd(561);
- Span3.setText("x = 0.6 -0.9");
- spanList.add(Span3);
- Span Span4 = new Span();
- Span4.setOffsetStart(562);
- Span4.setOffsetEnd(569);
- Span4.setText("exhibit");
- spanList.add(Span4);
- Span Span5 = new Span();
- Span5.setOffsetStart(570);
- Span5.setOffsetEnd(592);
- Span5.setText("bulk superconductivity");
- spanList.add(Span5);
- Span Span6 = new Span();
- Span6.setOffsetStart(632);
- Span6.setOffsetEnd(647);
- Span6.setText("superconducting");
- spanList.add(Span6);
+ Span span1 = new Span();
+ span1.setOffsetStart(445);
+ span1.setOffsetEnd(458);
+ span1.setText("FeSe 1-x Te x");
+ spanList.add(span1);
+ Pair indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 445, 458);
+ span1.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
- Span Span7 = new Span();
- Span7.setOffsetStart(653);
- Span7.setOffsetEnd(675);
- Span7.setText("transition temperature");
- spanList.add(Span7);
+ Span span2 = new Span();
+ span2.setOffsetStart(460);
+ span2.setOffsetEnd(471);
+ span2.setText("0.6 ≤ x ≤ 1");
+ spanList.add(span2);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 460, 471);
+ span2.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
+ Span span3 = new Span();
+ span3.setOffsetStart(549);
+ span3.setOffsetEnd(561);
+ span3.setText("x = 0.6 -0.9");
+ spanList.add(span3);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 549, 561);
+ span3.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
+ Span span4 = new Span();
+ span4.setOffsetStart(562);
+ span4.setOffsetEnd(569);
+ span4.setText("exhibit");
+ spanList.add(span4);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 562, 569);
+ span4.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
+ Span span5 = new Span();
+ span5.setOffsetStart(570);
+ span5.setOffsetEnd(592);
+ span5.setText("bulk superconductivity");
+ spanList.add(span5);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 570, 592);
+ span5.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
+ Span span6 = new Span();
+ span6.setOffsetStart(632);
+ span6.setOffsetEnd(647);
+ span6.setText("superconducting");
+ spanList.add(span6);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 632, 647);
+ span6.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
+ Span span7 = new Span();
+ span7.setOffsetStart(653);
+ span7.setOffsetEnd(675);
+ span7.setText("transition temperature");
+ spanList.add(span7);
+ indexes = AdditionalLayoutTokensUtil.getExtremitiesAsIndex(layoutTokens, 653, 675);
+ span7.setLayoutTokens(layoutTokens.subList(indexes.getLeft(), indexes.getRight()));
List documentBlocks = new ArrayList<>();
- documentBlocks.add(new DocumentBlock(layoutTokens, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_PARAGRAPH, spanList, new ArrayList<>()));
+ documentBlocks.add(new DocumentBlock(layoutTokens, DocumentBlock.SECTION_BODY, DocumentBlock.SUB_SECTION_PARAGRAPH, "1", spanList, new ArrayList<>()));
//This will ensure that next time I modify the principle on which the offsets are calculated, will fail
int startingOffset = layoutTokens.get(0).getOffset();
@@ -387,11 +472,11 @@ public void textTrainingDataExtraction_textBody_withOffsets() throws Exception {
String output = target.format(documentBlocks, 1);
- is("The electronic specific heat of as-grown and annealed single-crystals of FeSe 1-x Te x (0.6 ≤ x ≤ 1 ) has been investigated. " +
+ is("The electronic specific heat of as-grown and annealed single-crystals of FeSe 1-x Te x (0.6 ≤ x ≤ 1 ) has been investigated. " +
"It has been found that annealed single-crystals with x = 0.6 -0.9 exhibit bulk superconductivity with a clear specific-heat jump at the superconducting (SC) transition temperature , T c . Both 2Δ 0 /k B T c [Δ 0 : the SC gap at 0 K estimated using the single-band BCS s-wave model] and ⊿C/(γ n -γ 0 )T c [⊿C: the specific-heat jump at T c , γ n : the electronic specific-heat coefficient in the normal state, γ 0 : the residual electronic specific-heat coefficient at 0 K in the SC state] are largest in the well-annealed single-crystal with x = 0.7, i.e., 4.29 and 2.76, respectively, indicating that the superconductivity is of the strong coupling. " +
"The thermodynamic critical field has also been estimated. " +
"γ n has been found to be one order of magnitude larger than those estimated from the band calculations and increases with increasing x at x = 0.6 -0.9, which is surmised to be due to the increase in the electronic effective mass, namely, the enhancement of the electron correlation. " +
- "It has been found that there remains a finite value of γ 0 in the SC state even in the well-annealed single-crystals with x = 0.8 -0.9, suggesting an inhomogeneous electronic state in real space and/or momentum space.
+ "It has been found that there remains a finite value of γ 0 in the SC state even in the well-annealed single-crystals with x = 0.8 -0.9, suggesting an inhomogeneous electronic state in real space and/or momentum space.
@Test(expected = RuntimeException.class)
diff --git a/src/test/java/org/grobid/service/controller/AnnotationControllerTest.java b/src/test/java/org/grobid/service/controller/AnnotationControllerTest.java
index 224fac65..8caa5101 100644
--- a/src/test/java/org/grobid/service/controller/AnnotationControllerTest.java
+++ b/src/test/java/org/grobid/service/controller/AnnotationControllerTest.java
@@ -1,41 +1,40 @@
package org.grobid.service.controller;
-import com.squarespace.jersey2.guice.JerseyGuiceUtils;
-import io.dropwizard.testing.junit.ResourceTestRule;
import org.glassfish.jersey.media.multipart.FormDataMultiPart;
import org.glassfish.jersey.media.multipart.MultiPart;
import org.glassfish.jersey.media.multipart.MultiPartFeature;
import org.junit.ClassRule;
import org.junit.Test;
-import javax.ws.rs.client.Entity;
+import jakarta.ws.rs.client.Entity;
-import static javax.ws.rs.core.MediaType.APPLICATION_JSON_TYPE;
+import static jakarta.ws.rs.core.MediaType.APPLICATION_JSON_TYPE;
-public class AnnotationControllerTest {
- static {
- JerseyGuiceUtils.install((s, serviceLocator) -> null);
- }
- @ClassRule
- public static final ResourceTestRule RULE = ResourceTestRule.builder()
- .addResource(new AnnotationController(null, null))
- .addProvider(MultiPartFeature.class)
- .build();
+public class AnnotationControllerTest {
- @Test
- public void testResource() {
- final MultiPart multiPartEntity = new FormDataMultiPart()
- .field("input", "{\"runtime\": 1234}", APPLICATION_JSON_TYPE);
- String s = RULE.client().target("/process/json")
- .register(MultiPartFeature.class).request()
- .post(Entity.entity(multiPartEntity, multiPartEntity.getMediaType()))
- .readEntity(String.class);
- System.out.println(s);
- }
+// static {
+// JerseyGuiceUtils.install((s, serviceLocator) -> null);
+// }
+// @ClassRule
+// public static final ResourceTestRule RULE = ResourceTestRule.builder()
+// .addResource(new AnnotationController(null, null))
+// .addProvider(MultiPartFeature.class)
+// .build();
+// @Test
+// public void testResource() {
+// final MultiPart multiPartEntity = new FormDataMultiPart()
+// .field("input", "{\"runtime\": 1234}", APPLICATION_JSON_TYPE);
+// String s = RULE.client().target("/process/json")
+// .register(MultiPartFeature.class).request()
+// .post(Entity.entity(multiPartEntity, multiPartEntity.getMediaType()))
+// .readEntity(String.class);
+// System.out.println(s);
+// }
\ No newline at end of file