Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

_TAGS for fine-grained tasks #703

Open
wants to merge 20 commits into
base: main
Choose a base branch
from
3 changes: 2 additions & 1 deletion bigbio/biodatasets/an_em/an_em.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,9 +29,10 @@
import bigbio.utils.parsing as parse
from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.ANATOMY]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/anat_em/anat_em.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,9 +27,10 @@
import bigbio.utils.parsing as parsing
from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.ANATOMY]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/ask_a_patient/ask_a_patient.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,11 +21,12 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "ask_a_patient"

_TAGS = [Tags.ADR]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bc5cdr/bc5cdr.py
Original file line number Diff line number Diff line change
Expand Up @@ -31,10 +31,11 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses
from bigbio.utils.parsing import get_texts_and_offsets_from_bioc_ann

_TAGS = [Tags.DISEASE, Tags.CHEMICAL]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bc7_litcovid/bc7_litcovid.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,9 +20,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.COVID]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bio_sim_verb/bio_sim_verb.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,10 +27,11 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

# TODO: Add BibTeX citation
_TAGS = [Tags.LEXICAL]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bio_simlex/bio_simlex.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,10 +27,11 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

# TODO: Add BibTeX citation
_TAGS = [Tags.LEXICAL]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -51,9 +51,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.DOCUMENT_INDEXING]
_LANGUAGES = [Lang.ES]
_PUBMED = False
_LOCAL = False
Expand Down
9 changes: 8 additions & 1 deletion bigbio/biodatasets/bioasq_task_b/bioasq_task_b.py
Original file line number Diff line number Diff line change
Expand Up @@ -32,9 +32,16 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [
Tags.YESNO,
Tags.FACTOID,
Tags.FACTOID_LIST,
Tags.ABSTRACTIVE,
Tags.EXTRACTIVE,
]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = True
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,9 +23,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.GRANT]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = True
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bioinfer/bioinfer.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,9 +25,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.PPI]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -30,9 +30,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.HOW, Tags.WHY]
_LANGUAGES = [Lang.EN]
_PUBMED = False
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/biomrc/biomrc.py
Original file line number Diff line number Diff line change
Expand Up @@ -31,9 +31,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.MULTIPLE_CHOICE, Tags.MRC, Tags.CLOZE_TEST]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -21,10 +21,15 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses
from bigbio.utils.parsing import brat_parse_to_bigbio_kb, parse_brat_file

# http://www.wikicfp.com/cfp/servlet/event.showcfp?eventid=4605&copyownerid=320
# Task 1. Event detection and characterization
# Task 2. Event argument recognition
# Task 3. Recognition of negations and speculations
_TAGS = [Tags.PPI, Tags.NEGATION, Tags.SPECULATION, Tags.GENE]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -21,13 +21,14 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2011_epi"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [Tags.EPIGENETICS, Tags.NEGATION, Tags.SPECULATION, Tags.GENE]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bionlp_st_2011_ge/bionlp_st_2011_ge.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,14 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2011_ge"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [Tags.NEGATION, Tags.SPECULATION, Tags.GENE]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
10 changes: 9 additions & 1 deletion bigbio/biodatasets/bionlp_st_2011_id/bionlp_st_2011_id.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,21 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2011_id"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [
Tags.DISEASE,
Tags.GENE,
Tags.CHEMICAL,
Tags.SPECIES,
Tags.SPECULATION,
Tags.NEGATION,
]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,14 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2011_rel"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [Tags.PART_OF, Tags.GENE]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
12 changes: 11 additions & 1 deletion bigbio/biodatasets/bionlp_st_2013_cg/bionlp_st_2013_cg.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,12 +20,22 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2013_cg"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [
Tags.DISEASE,
Tags.CANCER,
Tags.TISSUE,
Tags.SPECIES,
Tags.CELL,
Tags.GENE,
Tags.CHEMICAL,
Tags.PATHWAY_CURATION,
]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bionlp_st_2013_ge/bionlp_st_2013_ge.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,14 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2013_ge"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [Tags.NEGATION, Tags.SPECULATION, Tags.GENE]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -21,13 +21,14 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2013_gro"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [Tags.GENE, Tags.SPECIES, Tags.CELL, Tags.TISSUE]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
9 changes: 8 additions & 1 deletion bigbio/biodatasets/bionlp_st_2013_pc/bionlp_st_2013_pc.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,12 +20,19 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2013_pc"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [
Tags.GENE,
Tags.CHEMICAL,
Tags.PATHWAY_CURATION,
Tags.NEGATION,
Tags.SPECULATION,
]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bionlp_st_2019_bb/bionlp_st_2019_bb.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,14 @@

from bigbio.utils import parsing, schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "bionlp_st_2019_bb"
_SOURCE_VIEW_NAME = "source"
_UNIFIED_VIEW_NAME = "bigbio"

_TAGS = [Tags.SPECIES]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/biored/biored.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,10 +26,11 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

# TODO: Add BibTeX citation
_TAGS = [Tags.GENE, Tags.DISEASE, Tags.CHEMICAL, Tags.VARIANT, Tags.PPI]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/biorelex/biorelex.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,10 +35,11 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

# TODO: Add BibTeX citation
_TAGS = [Tags.GENE, Tags.CHEMICAL, Tags.VARIANT, Tags.NEGATION, Tags.SPECULATION]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/bioscope/bioscope.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,9 +35,10 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_TAGS = [Tags.NEGATION, Tags.SPECULATION]
_LANGUAGES = [Lang.EN]
_PUBMED = True
_LOCAL = False
Expand Down
3 changes: 2 additions & 1 deletion bigbio/biodatasets/biosses/biosses.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,11 +28,12 @@

from bigbio.utils import schemas
from bigbio.utils.configs import BigBioConfig
from bigbio.utils.constants import Lang, Tasks
from bigbio.utils.constants import Lang, Tags, Tasks
from bigbio.utils.license import Licenses

_DATASETNAME = "biosses"

_TAGS = [Tags.SENTENCE]
_LANGUAGES = [Lang.EN]
_PUBMED = False
_LOCAL = False
Expand Down
Loading