Spaces:

ai4data
/

datause-detector

Running

rafmacalaba committed 17 days ago

Commit

ab71a6e

1 Parent(s): 929cf45

add labels and rels

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,10 +11,6 @@ _CACHE_DIR = os.environ.get("CACHE_DIR", None)
 from gliner import GLiNER
 from gliner.multitask import GLiNERRelationExtractor
-# Import inference pipeline and configuration
-from my_project.pipeline import inference_pipeline
-from my_project.config import TYPE2RELS, labels
 # Cache and initialize model + relation extractor
 DATA_MODEL_ID = "rafmacalaba/gliner_re_finetuned-v3"
 model = GLiNER.from_pretrained(DATA_MODEL_ID, cache_dir=_CACHE_DIR)
@@ -34,6 +30,17 @@ SAMPLE_TEXT = (
 # Post-processing: prune acronyms and self-relations
 def prune_acronym_and_self_relations(ner_preds, rel_preds):
     # 1) Find acronym targets strictly shorter than their source
     acronym_targets = {

 from gliner import GLiNER
 from gliner.multitask import GLiNERRelationExtractor
 # Cache and initialize model + relation extractor
 DATA_MODEL_ID = "rafmacalaba/gliner_re_finetuned-v3"
 model = GLiNER.from_pretrained(DATA_MODEL_ID, cache_dir=_CACHE_DIR)
 # Post-processing: prune acronyms and self-relations
+labels = ['named dataset', 'unnamed dataset', 'vague dataset']
+rels = ['acronym', 'author', 'data description',\
+        'data geography', 'data source', 'data type',\
+        'publication year', 'publisher', 'reference year', 'version']
+TYPE2RELS = {
+    "named dataset":   rels,
+    "unnamed dataset": rels,
+    "vague dataset":   rels,
+}
 def prune_acronym_and_self_relations(ner_preds, rel_preds):
     # 1) Find acronym targets strictly shorter than their source
     acronym_targets = {