var base_url=".";var index_prefix="JSS-subindex-";var doc_url=[
"101",
"102",
"104",
"105",
"106",
"107",
"108",
"109",
"10",
"114",
"115",
"116",
"117",
"119",
"11",
"120",
"121",
"123",
"124",
"126",
"129",
"130",
"132",
"133",
"136",
"137",
"139",
"13",
"142",
"143",
"144",
"145",
"146",
"147",
"149",
"152",
"154",
"155",
"156",
"157",
"158",
"159",
"15",
"160",
"161",
"162",
"163",
"164",
"165",
"166",
"168",
"169",
"172",
"173",
"174",
"175",
"176",
"177",
"17",
"184",
"185",
"186",
"187",
"188",
"189",
"190",
"191",
"192",
"193",
"197",
"198",
"200",
"202",
"203",
"204",
"205",
"207",
"208",
"20",
"210",
"211",
"212",
"213",
"214",
"215",
"216",
"217",
"218",
"219",
"21",
"220",
"221",
"222",
"226",
"227",
"228",
"229",
"22",
"231",
"234",
"235",
"236",
"237",
"238",
"239",
"23",
"240",
"241",
"244",
"246",
"247",
"249",
"24",
"250",
"253",
"254",
"255",
"256",
"258",
"259",
"25",
"262",
"264",
"26",
"270",
"272",
"273",
"274",
"275",
"276",
"277",
"278",
"279",
"280",
"281",
"283",
"284",
"286",
"287",
"288",
"289",
"28",
"290",
"291",
"292",
"293",
"294",
"295",
"296",
"297",
"299",
"300",
"301",
"303",
"304",
"306",
"308",
"309",
"30",
"313",
"315",
"316",
"317",
"319",
"321",
"322",
"323",
"324",
"326",
"327",
"328",
"329",
"32",
"330",
"331",
"334",
"335",
"336",
"337",
"340",
"342",
"343",
"344",
"345",
"346",
"347",
"348",
"349",
"351",
"352",
"353",
"355",
"358",
"359",
"35",
"361",
"363",
"364",
"365",
"366",
"368",
"370",
"373",
"375",
"376",
"377",
"378",
"37",
"380",
"382",
"383",
"384",
"385",
"386",
"389",
"38",
"390",
"391",
"392",
"393",
"397",
"398",
"399",
"39",
"400",
"402",
"403",
"404",
"405",
"407",
"409",
"410",
"411",
"415",
"418",
"419",
"420",
"421",
"422",
"423",
"424",
"425",
"427",
"428",
"429",
"42",
"433",
"434",
"435",
"437",
"438",
"439",
"43",
"440",
"442",
"443",
"444",
"445",
"447",
"448",
"449",
"44",
"451",
"454",
"455",
"458",
"459",
"45",
"460",
"461",
"463",
"465",
"468",
"469",
"46",
"471",
"472",
"473",
"475",
"477",
"478",
"479",
"481",
"482",
"483",
"484",
"486",
"487",
"48",
"490",
"491",
"493",
"495",
"496",
"499",
"49",
"500",
"501",
"502",
"507",
"509",
"50",
"510",
"511",
"512",
"514",
"515",
"516",
"518",
"519",
"51",
"520",
"521",
"522",
"523",
"524",
"528",
"52",
"533",
"534",
"535",
"536",
"537",
"538",
"539",
"540",
"541",
"542",
"543",
"544",
"545",
"546",
"547",
"549",
"54",
"550",
"551",
"552",
"553",
"554",
"556",
"557",
"558",
"559",
"55",
"560",
"561",
"562",
"564",
"565",
"566",
"567",
"568",
"569",
"56",
"573",
"574",
"575",
"576",
"577",
"578",
"57",
"580",
"581",
"582",
"583",
"584",
"586",
"587",
"588",
"590",
"592",
"594",
"595",
"596",
"598",
"599",
"600",
"604",
"606",
"607",
"608",
"609",
"60",
"610",
"611",
"612",
"613",
"614",
"616",
"617",
"618",
"619",
"61",
"620",
"621",
"622",
"623",
"624",
"625",
"626",
"627",
"628",
"629",
"62",
"630",
"631",
"632",
"635",
"638",
"639",
"640",
"641",
"643",
"644",
"645",
"647",
"648",
"64",
"651",
"652",
"654",
"656",
"657",
"658",
"660",
"661",
"662",
"663",
"664",
"665",
"66",
"671",
"674",
"676",
"677",
"678",
"679",
"67",
"685",
"686",
"68",
"691",
"693",
"695",
"698",
"699",
"69",
"700",
"702",
"706",
"707",
"709",
"70",
"710",
"712",
"713",
"715",
"716",
"717",
"718",
"71",
"720",
"721",
"722",
"724",
"725",
"728",
"729",
"72",
"732",
"733",
"734",
"735",
"736",
"737",
"738",
"739",
"73",
"740",
"741",
"742",
"743",
"746",
"748",
"749",
"750",
"751",
"754",
"755",
"758",
"759",
"75",
"760",
"762",
"763",
"764",
"765",
"769",
"76",
"770",
"771",
"772",
"773",
"774",
"775",
"776",
"777",
"779",
"77",
"780",
"783",
"784",
"785",
"786",
"787",
"788",
"789",
"78",
"790",
"791",
"793",
"794",
"795",
"796",
"797",
"798",
"79",
"7",
"802",
"804",
"805",
"806",
"807",
"811",
"812",
"813",
"814",
"815",
"816",
"817",
"818",
"819",
"820",
"821",
"822",
"823",
"825",
"826",
"827",
"828",
"830",
"831",
"832",
"835",
"83",
"843",
"844",
"847",
"848",
"849",
"84",
"851",
"855",
"856",
"858",
"860",
"861",
"862",
"863",
"864",
"866",
"867",
"869",
"86",
"870",
"871",
"873",
"874",
"875",
"877",
"87",
"880",
"881",
"882",
"884",
"885",
"886",
"887",
"88",
"892",
"894",
"896",
"898",
"899",
"89",
"8",
"900",
"901",
"902",
"903",
"904",
"907",
"908",
"909",
"90",
"911",
"912",
"913",
"914",
"915",
"917",
"91",
"92",
"93",
"94",
"95",
"96",
"97",
"99"];
var doc_title=["The Encoding of lexical implications in VerbNet Predicates of change of locations",
"STC-TIMIT: Generation of a Single-channel Telephone Corpus",
"Evaluation of Linguistics-Based Translation",
"The U.S. Policy Agenda Legislation Corpus Volume 1 - a Language Resource from 1947 - 1998",
"SpatialML: Annotation Scheme, Corpora, and Tools",
"Selection of Japanese-English Equivalents by Integrating High-quality Corpora and Huge Amounts of Web Data",
"Integrating Metaphor Information into RDF/OWL EuroWordNet",
"Exploiting Lexical Resources for Disambiguating CJK and Arabic Orthographic Variants",
"A Compact Arabic Lexical Semantics Language Resource Based on the Theory of Semantic Fields",
"Does Netgraph Fit Prague Dependency Treebank?",
"Modeling Document Dynamics: an Evolutionary Approach",
"Evaluation of a Machine Translation System for Low Resource Languages: METIS-II",
"Tapping Huge Temporally Indexed Textual Resources with WCTAnalyze",
"Evaluation of Different Segmentation Techniques for Dialogue Turns",
"Benchmarking Textual Annotation Tools for the Semantic Web",
"Subdomain Sensitive Statistical Parsing using Raw Corpora",
"Swedish-Turkish Parallel Treebank",
"Evaluating Summaries Automatically - A system Proposal",
"Comparing Dependency and Constituent Syntax for Frame-semantic Analysis",
"Sentence Alignment in DPC: Maximizing Precision, Minimizing Human Effort",
"MeSH&copy;: from a Controlled Vocabulary to a Processable Resource",
"Building Affective Lexicons from Specific Corpora for Automatic Sentiment Analysis",
"The IFADV Corpus: a Free Dialog Video Corpus",
"A Multi-Lingual Dictionary of Dirty Words",
"Uncertainty Corpus: Resource to Study User Affect in Complex Spoken Dialogue Systems",
"Annotation Guidelines for Chinese-Korean Word Alignment",
"Ontology-Based XQuery&#146;ing of XML-Encoded Language Resources on Multiple Annotation Layers",
"Introducing DRS (The Digital Replay System): a Tool for the Future of Corpus Linguistic Research and Analysis",
"LexSchem: a Large Subcategorization Lexicon for French Verbs",
"FATE: a FrameNet-Annotated Corpus for Textual Entailment",
"Do we Still Need Gold Standards for Evaluation?",
"Automatic Document Quality Control",
"Unsupervised Resource Creation for Textual Inference Applications",
"Eksairesis: A Domain-Adaptable System for Ontology Building from Unstructured Text",
"On the Role of the NIMITEK Corpus in Developing an Emotion Adaptive Spoken Dialogue System",
"A Trainable Tokenizer, solution for multilingual texts and compound expression tokenization",
"Learning-based Detection of Scientific Terms in Patient Information",
"On the Use of Web Resources and Natural Language Processing Techniques to Improve Automatic Speech Recognition Systems",
"Language Resources and Tools for Swedish: A Survey",
"Detecting Errors in Semantic Annotation",
"Saxon: an Extensible Multimedia Annotator",
"Glossa: a Multilingual, Multimodal, Configurable User Interface",
"A Semantically Annotated Swedish Medical Corpus",
"Classification Procedures for Software Evaluation",
"A Test Suite for Inference Involving Adjectives",
"Cleaneval: a Competition for Cleaning Web Pages",
"From Field Notes towards a Knowledge Base",
"SCARE: a Situated Corpus with Annotated Referring Expressions",
"Automatic Assessment of Japanese Text Readability Based on a Textbook Corpus",
"ParsCit: an Open-source CRF Reference String Parsing Package",
"Sign Language Corpus Annotation: toward a new Methodology",
"Automatic Acquisition of Usage Information for Language Resources",
"Automatic Rich Annotation of Large Corpus of Conversational transcribed speech: the Chunking Task of the EPAC Project",
"Automatic Translation of Biomedical Terms by Supervised Machine Learning",
"Morphosyntactic Resources for Automatic Speech Recognition",
"Automatic Construction of a Japanese-Chinese Dictionary via English",
"The Kalshnikov 691 Dependency Bank",
"Cost-Sensitive Learning in Answer Extraction",
"LIRICS Semantic Role Annotation: Design and Evaluation of a Set of Data Categories",
"Adjectives in the Dutch Semantic Lexical Database CORNETTO",
"Analysis and Performance of Morphological Query Expansion and Language-Filtering Words on Basque Web Searching",
"Chooser: a Multi-Task Annotation Tool",
"Corpus Analysis of Spoken Smart-Home Interactions with Older Users",
"Named Entity WordNet",
"Turning a Term Extractor into a new Domain: first Experiences",
"Presentation of the New ISO-Standard for the Representation of Entries in Dictionaries: ISO 1951",
"New Functions of FrameSQL for Multilingual FrameNets",
"Named Entity Relation Mining using Wikipedia",
"Local Methods for On-Demand Out-of-Vocabulary Word Retrieval",
"Acquisition and Evaluation of a Dialog Corpus through WOz and Dialog Simulation Techniques",
"Rapid Deployment of a New METIS Language Pair: Catalan-English",
"Developing a TT-MCTAG for German with an RCG-based Parser",
"Towards a Vector Space Model for FrameNet-like Resources",
"AnCora-Verb: A Lexical Resource for the Semantic Annotation of Corpora",
"Ensuring Semantic Interoperability on Lexical Resources",
"Exploring and Enriching a Language Resource Archive via the Web",
"Cross-Corpus Evaluation of Word Alignment",
"Annotation by Category: ELAN and ISO DCR",
"Investigating the Structure of Procedural Texts for Answering How-to Questions",
"A Simple Method for Tagset Comparision",
"Towards the National Corpus of Polish",
"&#9824; Demo: An Open Source Tool for Partial Parsing and Morphosyntactic Disambiguation",
"Definition Extraction Using a Sequential Combination of Baseline Grammars and Machine Learning Classifiers",
"OpenCCG Workbench and Visualization Tool",
"Ontology-Based Interface Specifications for a NLP Pipeline Architecture",
"Exploring and Navigating: Tools for GermaNet",
"Evaluation of several Maximum Likelihood Linear Regression Variants for Language Adaptation.",
"The BNC Parsed with RASP4UIMA",
"Towards a Glossary of Activities in the Ontology Engineering Field",
"Extended Named Entity Ontology with Attribute Information",
"Using the Web as a Linguistic Resource to Automatically Correct Lexico-Syntactic Errors",
"Conceptual Modeling of Ontology-based Linguistic Resources with a Focus on Semantic Relations",
"ISOcat: Corralling Data Categories in the Wild",
"BioSec Multimodal Biometric Database in Text-Dependent Speaker Recognition",
"I saw TREE trees in the park: How to Correct Real-Word Spelling Mistakes",
"An Automatic Close Copy Speech Synthesis Tool for Large-Scale Speech Corpus Evaluation",
"Building a Corpus of Temporal-Causal Structure",
"Bilingual Text Classification using the IBM 1 Translation Model",
"Ontologizing Lexicon Access Functions based on an LMF-based Lexicon Taxonomy",
"Annotating Superlatives",
"A Semantic Memory for Incremental Ontology Population",
"Improving Contextual Quality Models for MT Evaluation Based on Evaluators&#146; Feedback",
"A Fully Annotated Corpus for Studying the Effect of Cognitive Ageing on Users&#146; Interactions with Spoken Dialogue Systems",
"A Multimodal Infant Behavior Annotation for Developmental Analysis of Demonstrative Expressions",
"Controlling Redundancy in Referring Expressions",
"An Inverted Index for Storing and Retrieving Grammatical Dependencies",
"A Flexible Wizard of Oz Environment for Rapid Prototyping",
"BART: A modular toolkit for coreference resolution",
"Evaluating Robustness Of A QA System Through A Corpus Of Real-Life Questions",
"Evaluation of Lexical Resources and Semantic Networks on a Corpus of Mental Associations",
"Lexical Resources for Automatic Translation of Constructed Neologisms: the Case Study of Relational Adjectives",
"A Comparative Study on Language Identification Methods",
"A Question Answering System for German. Experiments with Morphological Linguistic Resources",
"Building a Golden Collection of Parallel Multi-Language Word Alignment",
"POS Tagging for German: how important is the Right Context?",
"Children&#146;s Oral Reading Corpus (CHOREC): Description and Assessment of Annotator Agreement",
"Integrating Lexical Units, Synsets and Ontology in the Cornetto Database",
"Semantic Frame Annotation on the French MEDIA corpus",
"A Proper Approach to Japanese Morphological Analysis: Dictionary, Model, and Evaluation",
"Word Alignment Annotation in a Japanese-Chinese Parallel Corpus",
"The Annotation Guidelines of the Latin Dependency Treebank and Index Thomisticus Treebank: the Treatment of some specific Syntactic Constructions in Latin",
"Ontology Search with the OntoSelect Ontology Library",
"Semi-automatic Building Method for a Multidimensional Affect Dictionary for a New Language",
"Structural Metadata Annotation of Speech Corpora: Comparing Broadcast News and Broadcast Conversations",
"A Framework for Multilingual Ontology Mapping",
"Measures for Term and Sentence Relevances: an Evaluation for German",
"Evaluating Evaluation Metrics for Ontology-Based Applications: Infinite Reflection",
"Spelling Correction: from Two-Level Morphology to Open Source",
"Lexical Substitution as a Framework for Multiword Evaluation",
"Sentiment Analysis and the Use of Extrinsic Datasets in Evaluation",
"Manual vs Assisted Transcription of Prepared and Spontaneous Speech",
"LILA: Cellular Telephone Speech Databases from Asia",
"Evaluating Dialogue Act Tagging with Naive and Expert Annotators",
"Certification and Cleaning up of a Text Corpus: Towards an Evaluation of the &#147;Grammatical&#148; Quality of a Corpus",
"Harvesting Multi-Word Expressions from Parallel Corpora",
"Developing a Phonemic and Syllabic Frequency Inventory for Spontaneous Spoken Castilian Spanish and their Comparison to Text-Based Inventories",
"Yet another Platform for Extracting Knowledge from Corpora",
"UnsuParse: unsupervised Parsing with unsupervised Part of Speech Tagging",
"Benchmark Databases for Video-Based Automatic Sign Language Recognition",
"Acquiring Naturalistic Concept Descriptions from the Web",
"What would you Ask a conversational Agent? Observations of Human-Agent Dialogues in a Museum Setting",
"The 2008 Oriental COCOSDA Book Project: in Commemoration of the First Decade of Sustained Activities in Asia",
"Validating the Quality of Full Morphological Annotation",
"A Ground Truth Dataset for Matching Culturally Diverse Romanized Person Names",
"Using Log-linear Models for Tuning Machine Translation Output",
"MISTRAL: a Statistical Machine Translation Decoder for Speech Recognition Lattices",
"Using Semantically Annotated Corpora to Build Collocation Resources",
"Statistical Identification of English Loanwords in Korean Using Automatically Generated Training Data",
"A Suite to Compile and Analyze an LSP Corpus",
"Anaphoric Annotation in the ARRAU Corpus",
"Translation Adequacy and Preference Evaluation Tool (TAP-ET)",
"Semantic Vectors: a Scalable Open Source Package and Online Technology Management Application",
"Division of Example Sentences Based on the Meaning of a Target Word Using Semi-Supervised Clustering",
"Is this NE tagger getting old?",
"CzEng 0.7: Parallel Corpus with Community-Supplied Translations",
"Similar Term Discovery using Web Search",
"Toward Active Learning in Data Selection: Automatic Discovery of Language Features During Elicitation",
"Unsupervised Parts-of-Speech Induction for Bengali",
"Process Model for Composing High-quality Text Corpora",
"Babylon Parallel Text Builder: Gathering Parallel Texts for Low-Density Languages",
"Computational Models for Event Type Classification in Context",
"Design and Recording of Czech Audio-Visual Database with Impaired Conditions for Continuous Speech Recognition",
"CLARIN: Common Language Resources and Technology Infrastructure",
"Thai Broadcast News Corpus Construction and Evaluation",
"Geo-WordNet: Automatic Georeferencing of WordNet",
"Coding Emotional Events in Audiovisual Corpora",
"Tools for Collocation Extraction: Preferences for Active vs. Passive",
"BOEMIE Ontology-Based Text Annotation Tool",
"JURISDIC: Polish Speech Database for Taking Dictation of Legal Texts",
"Audio Database in Support of Potentiel Threat and Crisis Situation Management",
"Condensing Sentences for Subtitle Generation",
"Building of a Speech Corpus Optimised for Unit Selection TTS Synthesis",
"Evaluation of Modules and Tools for Speech Synthesis: the ECESS Framework",
"A Common Multimedia Annotation Framework for Cross Linking Cultural Heritage Digital Collections",
"CORP-ORAL: Spontaneous Speech Corpus for European Portuguese",
"Automatic Acquisition for low frequency lexical items",
"Approximating Learning Curves for Active-Learning-Driven Annotation",
"Emotion Recognition from Speech: Stress Experiment",
"A Common Parts-of-Speech Tagset Framework for Indian Languages",
"Generalising Lexical Translation Strategies for MT Using Comparable Corpora",
"Named Entity Recognition for Digitised Historical Texts",
"Annotating an Arabic Learner Corpus for Error",
"A Multi-sensor Speech Database with Applications towards Robust Speech Processing in hostile Environments",
"Tagging Spanish Texts: the Problem of Problem of &#147;SE&#148;",
"Integration of a Multilingual Keyword Extractor in a Document Management System",
"A Framework for Identity Resolution and Merging for Multi-source Information Extraction",
"Tree Distance and Some Other Variants of Evalb",
"Some Fine Points of Hybrid Natural Language Parsing",
"Using the Multilingual Central Repository for Graph-Based Word Sense Disambiguation",
"Making Text Resources Accessible to the Reader: the Case of Patent Claims",
"Dictionary of Multiword Expressions for Translation into highly Inflected Languages",
"A Knowledge-Modeling Approach for Multilingual Regulus Lexica",
"LC-STAR II: Starring more Lexica",
"The LECTRA Corpus - Classroom Lecture Transcriptions in European Portuguese",
"AnCora: Multilevel Annotated Corpora for Catalan and Spanish",
"Word-Based or Morpheme-Based? Annotation Strategies for Modern Hebrew Clitics",
"A Japanese-English Technical Lexicon for Translation and Language Research",
"Foundation of a Component-based Flexible Registry for Language Resources and Technology",
"From D-Coi to SoNaR: a reference corpus for Dutch",
"Recording Speech of Children, Non-Natives and Elderly People for HLT Applications: the JASMIN-CGN Corpus.",
"Influence of Text Type and Text Length on Anaphoric Annotation",
"Building a Federation of Language Resource Repositories: the DAM-LR Project and its Continuation within CLARIN.",
"KYOTO: a System for Mining, Structuring and Distributing Knowledge across Languages and Cultures",
"Domain-Specific English-To-Spanish Translation of FrameNet",
"A Grid of Regional Language Archives",
"Enriching Frame Semantic Resources with Dependency Graphs",
"A Multi-Word Term Extraction Program for Arabic Language",
"Professor or Screaming Beast? Detecting Anomalous Words in Chinese",
"Language-Sites: Accessing and Presenting Language Resources via Geographic Information Systems",
"BLEU+: a Tool for Fine-Grained BLEU Computation",
"Experiments to Investigate the Connection between Case Distribution and Topical Relevance of Search Terms in an Information Retrieval Setting",
"Scaling Answer Type Detection to Large Hierarchies",
"The Dutch-Flemish Comprehensive Approach to HLT Stimulation and Innovation: STEVIN, HLT Agency and beyond",
"Identifying Strategic Information from Scientific Articles through Sentence Classification",
"Hydra: a Modal Logic Tool for Wordnet Development, Validation and Exploration",
"Ping-pong Document Clustering using NMF and Linkage-Based Refinement",
"Complete and Consistent Annotation of WordNet using the Top Concept Ontology",
"The Automatic Mapping of Princeton WordNet Lexical-Conceptual Relations onto the Brazilian Portuguese WordNet Database",
"Communicating Unknown Words in Machine Translation",
"Semantic Role Labeling Tools Trained on the Cast3LB-CoNNL-SemRol Corpus",
"How to Evaluate and Raise the Quality in a Collaborative Lexicographic Approach",
"Verb-Noun Collocation SyntLex Dictionary: Corpus-Based Approach",
"Odds of Successful Transfer of Low-Level Concepts: a Key Metric for Bidirectional Speech-to-Speech Machine Translation in DARPA&#146;s TRANSTAC Program",
"Creation of Learner Corpus and Its Application to Speech Recognition",
"Test Collections for Spoken Document Retrieval from Lecture Audio Data",
"Keywords, k-NN and Neural Networks: a Support for Hierarchical Categorization of Texts in Brazilian Portuguese",
"Post-MT Term Swapper: Supplementing a Statistical Machine Translation System with a User Dictionary",
"Temporal Aspects of Terminology for Automatic Term Recognition: Case Study on Women&#146;s Studies Terms",
"A Contextual Dynamic Network Model for WSD Using Associative Concept Dictionary",
"Automatic Extraction of Textual Elements from News Web Pages",
"Elicited Imitation as an Oral Proficiency Measure with ASR Scoring",
"Extraction of Informative Expressions from Domain-specific Documents",
"Boot-Strapping a WordNet Using Multiple Existing WordNets",
"Opinion Annotation in On-line Chinese Product Reviews",
"Unsupervised and Domain Independent Ontology Learning: Combining Heterogeneous Sources of Evidence",
"ALC: Alcohol Language Corpus",
"Extracting Lexical Semantic Knowledge from Wikipedia and Wiktionary",
"Phone Segmentation Tool with Integrated Pronunciation Lexicon and Czech Phonetically Labelled Reference Database.",
"Adapting International Standard for Asian Language Technologies",
"Building Bilingual Lexicons using Lexical Translation Probabilities via Pivot Languages",
"The European Thesaurus on International Relations and Area Studies - a Multilingual Resource for Indexing, Retrieval, and Translation",
"Unsupervised Relation Extraction From Web Documents",
"Building a Greek corpus for Textual Entailment",
"Construction of a Metadata Database for Efficient Development and Use of Language Resources",
"The Extended Architecture of Hantology for Japan Kanji",
"COLDIC, a Lexicographic Platform for LMF compliant lexica",
"Extraction of Attribute Concepts from Japanese Adjectives",
"Arabic WordNet: Semi-automatic Extensions using Bayesian Inference",
"Merging a Syntactic Resource with a WordNet: a Feasibility Study of a Merge between STO and DanNet",
"Subjective Evaluation of an Emotional Speech Database for Basque",
"Revealing Relations between Open and Closed Answers in Questionnaires through Text Clustering Evaluation",
"Standardising Bilingual Lexical Resources According to the Lexicon Markup Framework",
"Representation of Atypical Entities in Ontologies",
"Constructing a Database of Non-Japanese Pronunciations of Different Japanese Romanizations",
"Connecting Text Mining and Pathways using the PathText Resource",
"Developing Non-European Translation Pairs in a Medium-Vocabulary Medical Speech Translation System",
"Using Reordering in Statistical Machine Translation based on Alignment Block Classification",
"The ACL Anthology Reference Corpus: A Reference Dataset for Bibliographic Research in Computational Linguistics",
"ASV Toolbox: a Modular Collection of Language Exploration Tools",
"Integrating Audio and Visual Information for Modelling Communicative Behaviours Perceived as Different",
"Creating and Exploiting Multimodal Annotated Corpora",
"Automatic Identification of Temporal Information in Tourism Web Pages",
"WNTERM: Enriching the MCR with a Terminological Dictionary",
"Design of a Multimodal Database for Research on Automatic Detection of Severe Apnoea Cases",
"Combined Systems for Automatic Phonetic Transcription of Proper Nouns",
"Producing a Test Collection for Patent Machine Translation in the Seventh NTCIR Workshop",
"Corpus-based Semantic Relatedness for the Construction of Polish WordNet",
"Combining Multiple Models for Speech Information Retrieval",
"Learning the Species of Biomedical Named Entities from Annotated Corpora",
"Text Independent Speaker Identification in Multilingual Environments",
"Mutual Bilingual Terminology Extraction",
"Using Parsed Corpora for Estimating Stochastic Inversion Transduction Grammars",
"Evaluation Framework for Distant-talking Speech Recognition under Reverberant Environments: newest Part of the CENSREC Series -",
"The Japanese FrameNet Software Tools",
"A Dependency Parser for Thai",
"Mapping Events and Abstract Entities from PAROLE-SIMPLE-CLIPS to ItalWordNet",
"In-car Speech Data Collection along with Various Multimodal Signals",
"Corpus Co-Occurrence, Dictionary and Wikipedia Entries as Resources for Semantic Relatedness Information",
"Identification of Comparable Argument-Head Relations in Parallel Corpora",
"All, and only, the Errors: more Complete and Consistent Spelling and OCR-Error Correction Evaluation",
"Language Resources for Semantic Document Annotation and Crosslingual Retrieval",
"Corpus-Based Tools for Computer-Assisted Acquisition of Reading Abilities in Cognate Languages",
"Detecting Co-Derivative Documents in Large Text Collections",
"Robust Parsing with a Large HPSG Grammar",
"Towards Heterogeneous Automatic MT Error Analysis",
"Synchronizing Translated Movie Subtitles",
"RUNDKAST: an Annotated Norwegian Broadcast News Speech Corpus",
"Error Analysis for Learning-based Coreference Resolution",
"The AUTONOMATA Spoken Names Corpus",
"Enriching the Venice Italian Treebank with Dependency and Grammatical Relations",
"Developing Verb Frames for Hindi",
"Word Segmentation of Vietnamese Texts: a Comparison of Approaches",
"Romanian Lexical Data Bases: Inflected and Syllabic Forms Dictionaries",
"GENIA-GR: a Grammatical Relation Corpus for Parser Evaluation in the Biomedical Domain",
"Active Annotation in the LUNA Italian Corpus of Spontaneous Dialogues",
"A Coreference Corpus and Resolution System for Dutch",
"A Hybrid Approach to Extracting and Classifying Verb+Noun Constructions",
"Extracting Concrete Senses of Lexicon through Measurement of Conceptual Similarity in Ontologies",
"Cross-Domain Dialogue Act Tagging",
"Spatiotemporal Annotation Using MiniSTEx: how to deal with Alternative, Foreign, Vague and/or Obsolete Names?",
"User-Centred Design of Error Correction Tools",
"Evaluation Metrics for Automatic Temporal Annotation of Texts",
"Talking and Looking: the SmartWeb Multimodal Interaction Corpus",
"Question Answering on Speech Transcriptions: the QAST evaluation in CLEF",
"Constructing a Corpus that Indicates Patterns of Modification between Draft and Final Translations by Human Translators",
"Learning Patterns for Building Resources about Semantic Relations in the Medical Domain",
"Clustering Related Terms with Definitions",
"Exploiting Multiply Annotated Corpora in Biomedical Information Extraction Tasks",
"From Human Communication to Intelligent User Interfaces: Corpora of Spoken Estonian",
"Producing an Encyclopedic Dictionary using Patent Documents",
"Enriching GermaNet with verb-noun relations - a case study of lexical acquisition",
"Evaluation of Spoken Document Retrieval for Historic Speech Collections",
"Spatiotemporal Coding in ANVIL",
"Annotating Abstract Pronominal Anaphora in the DAD Project",
"Extraction and Evaluation of Keywords from Learning Objects: a Multilingual Approach",
"Developing Corpus of Japanese Classroom Lecture Speech Contents",
"Comparing Italian parsers on a common Treebank: the EVALITA experience",
"MaltEval: an Evaluation and Visualization Tool for Dependency Parsing",
"JMWNL: an Extensible Multilingual Library for Accessing Wordnets in Different Languages",
"Ontology Learning and Semantic Annotation: a Necessary Symbiosis",
"Applying Automated Metrics to Speech Translation Dialogs",
"Automatic extraction of subcategorization frames for Italian",
"Evaluating a German Sketch Grammar: A Case Study on Noun Phrase Case",
"A Comparative Evaluation of Term Recognition Algorithms",
"Evaluation of a Cross-lingual Romanian-English Multi-document Summariser",
"Exploiting the Role of Position Feature in Chinese Relation Extraction",
"Corpus Exploitation from Wikipedia for Ontology Construction",
"Sensitivity of Automated MT Evaluation Metrics on Higher Quality MT Output: BLEU vs Task-Based Evaluation Methods",
"Annotation of Information Structure: an Evaluation across different Types of Texts",
"Acquiring a Taxonomy from the German Wikipedia",
"The ATCOSIM Corpus of Non-Prompted Clean Air Traffic Control Speech",
"An Empirical Approach to a Preliminary Successful Identification and Resolution of Temporal Expressions in Spanish News Corpora",
"Building a Bio-Event Annotated Corpus for the Acquisition of Semantic Frames from Biomedical Corpora",
"A Multi-Genre SMT System for Arabic to French",
"DIAC+: a Professional Diacritics Recovering System",
"Dialogue, Speech and Images: the Companions Project Data Set",
"Entity Translation and Alignment in the ACE-07 ET Task",
"Authorship Attribution of E-Mail: Comparing Classifiers over a New Corpus for Evaluation",
"Slovene Terminology Web Portal and the TBX-Compatible Simplified DTD/schema",
"Speech Errors on Frequently Observed Homophones in French: Perceptual Evaluation vs Automatic Classification",
"Language Resources and Chemical Informatics",
"The MoveOn Motorcycle Speech Corpus",
"Relationships between Nursing Converstaions and Activities",
"Evaluating the Relationship between Linguistic and Geographic Distances using a 3D Visualization",
"Acquiring Pronunciation Data for a Placenames Lexicon in a Less-Resourced Language",
"Using a Probabilistic Model of Context to Detect Word Obfuscation",
"Development and Alignment of a Domain-Specific Ontology for Question Answering",
"A Web Browser Extension for Growing-up Ontological Knowledge from Traditional Web Content",
"A Large-Scale Web Data Collection as a Natural Language Processing Infrastructure",
"Creating a Research Collection of Question Answer Sentence Pairs with Amazon&#146;s Mechanical Turk",
"Annotating Expressions of Opinion and Emotion in the Italian Content Annotation Bank",
"Frame Information Transfer from English to Italian",
"Semantic Annotations for Biology: a Corpus Development Initiative at the Jena University Language & Information Engineering (JULIE) Lab",
"A LAF/GrAF based Encoding Scheme for underspecified Representations of syntactic Annotations.",
"Unsupervised Lexical Acquisition for Part of Speech Tagging",
"WEB-Based Listening Test System for Speech Synthesis and Speech Conversion Evaluation",
"F0 of Adolescent Speakers – First Results for the German Ph@ttSessionz Database",
"Automatic Emotional Degree Labeling for Speakers&#146; Anger Utterance during Natural Japanese Dialog",
"A lexicon for biology and bioinformatics: the BOOTStrep experience.",
"A Bottom-up Comparative Study of EuroWordNet and WordNet 3.0 Lexical and Semantic Relations",
"Building the Valency Lexicon of Arabic Verbs",
"Design and Data Collection for Spoken Polish Dialogs Database",
"Task-Based Evaluation of Meeting Browsers: from Task Elicitation to User Behavior Analysis",
"Semantically Annotated Snapshot of the English Wikipedia",
"Methodology for Evaluating the Usability of User Interfaces in Mobile Services",
"How to Compare Treebanks",
"WOZ Acoustic Data Collection for Interactive TV",
"Using Random Indexing to improve Singular Value Decomposition for Latent Semantic Analysis",
"Parallel Multi-Theory Annotations of Syntactic Structure",
"Chinese Core Ontology Construction from a Bilingual Term Bank",
"ANAWIKI: Creating Anaphorically Annotated Resources through Web Cooperation",
"Automatic Learning and Evaluation of User-Centered Objective Functions for Dialogue System Optimisation",
"Learning Morphology with Morfette",
"L-ISA: Learning Domain Specific Isa-Relations from the Web",
"Automatic Phone Segmentation of Expressive Speech",
"Simple-Clips ongoing research: more information with less data by implementing inheritance",
"Supersense Tagger for Italian",
"Vox Populi Annotation: Measuring Intensity of Ideological Perspectives by Aggregating Group Judgments",
"Towards Spanish Verbs&#146; Selectional Preferences Automatic Acquisition: Semantic Annotation of the SenSem Corpus",
"Automatic Phoneme Segmentation with Relaxed Textual Constraints",
"Challenges in Pronoun Resolution System for Biomedical Text",
"LMM: an OWL-DL MetaModel to Represent Heterogeneous Lexical Knowledge",
"Development of the Japanese WordNet",
"From Extracting to Abstracting: Generating Quasi-abstractive Summaries",
"A Bilingual Corpus of Inter-linked Events",
"Lexical Ontology Extraction using Terminology Analysis: Automating Video Annotation",
"Estimating Word Phonosemantics",
"The PIT Corpus of German Multi-Party Dialogues",
"Adaptation of Relation Extraction Rules to New Domains",
"An Economic View on Human Language Technology Evaluation",
"MASC: the Manually Annotated Sub-Corpus of American English",
"Boosting Precision and Recall of Hyponymy Relation Acquisition from Hierarchical Layouts in Wikipedia",
"Lexical Resources for Semantics Extraction",
"Event Detection and Summarization in Weblogs with Temporal Collocations",
"Building Mobile Spoken Dialogue Applications Using Regulus",
"EASY, Evaluation of Parsers of French: what are the Results?",
"CLIoS: Cross-lingual Induction of Speech Recognition Grammars",
"Encoding Terms from a Scientific Domain in a Terminological Database: Methodology and Criteria",
"Workbench with Authoring Tools for Collaborative Multi-lingual Ontological Knowledge Construction and Maintenance",
"Improving NER in Arabic Using a Morphological Tagger",
"Building a Bilingual Representation of the Roget Thesaurus for French to English Machine Translation",
"Using Lexical Acquisition to Enrich a Predicate Argument Reusable Database",
"The QALL-ME Benchmark: a Multilingual Resource of Annotated Spoken Requests for Question Answering",
"Clustering of Terms from Translation Dictionaries and Synonyms Lists to Automatically Build more Structured Linguistic Resources",
"Spectral Clustering for a Large Data Set by Reducing the Similarity Matrix Size",
"Evaluation of Natural Language Tools for Italian: EVALITA 2007",
"Rule-Based Chunker for Croatian",
"Data Collection for the CHIL CLEAR 2007 Evaluation Campaign",
"Identifying Foreign Person Names in Chinese Text",
"From Sentence to Discourse: Building an Annotation Scheme for Discourse Based on Prague Dependency Treebank",
"SECTra_w.1: an Online Collaborative System for Evaluating, Post-editing and Presenting MT Translation Corpora",
"LX-Service: Web Services of Language Technology for Portuguese",
"Generating Bilingual Dictionaries by Transitivity",
"Experimental Fast-Tracking of Morphological Analysers for Nguni Languages",
"Learning properties of Noun Phrases: from data to functions",
"The TextPro Tool Suite",
"Adjudicator Agreement and System Rankings for Person Name Search",
"Language Resources for Studying Argument",
"A Text-based Query Interface to OWL Ontologies",
"Enhancing an English-Polish Electronic Dictionary for Multiword Expression Research",
"CallSurf: Automatic Transcription, Indexing and Structuration of Call Center Conversational Speech for Knowledge Extraction and Query by Content",
"Towards Semi Automatic Construction of a Lexical Ontology for Persian",
"UFRA: a UIMA-based Approach to Federated Language Resource Architecture",
"Evaluating the Ontology underlying sMail - the Conceptual Framework for Semantic Email Communication",
"The UJIpenchars Database: a Pen-Based Database of Isolated Handwritten Characters",
"Parameters for Topic Boundary Detection in Multi-Party Dialogues",
"First Broadcast News Transcription System for Khmer Language",
"Targeting Chinese Nominal Compounds in Corpora",
"A Study of Parentheticals in Discourse Corpora - Implications for NLG Systems",
"A Real-World Emotional Speech Corpus for Modern Greek",
"A Three-stage Disfluency Classifier for Multi Party Dialogues",
"Reusable Tagset Conversion Using Tagset Drivers",
"Semiotic-based Ontology Evaluation Tool (S-OntoEval)",
"Comparing Corpus-based to Web-based Lookup Techniques for Automatic English Inclusion Detection",
"Centering Theory for Evaluation of Coherence in Computer-Aided Summaries",
"Linguistic Resources and Evaluation Techniques for Evaluation of Cross-Document Automatic Content Extraction",
"Fine-grained Opinion Topic and Polarity Identification",
"Holy Moses! Leveraging Existing Tools and Resources for Entity Translation",
"The Usage of Various Lexical Resources and Tools to Improve the Performance of Web Search Engines",
"Deriving Rhetorical Complexity Data from the RST-DT Corpus",
"Quality Assurance of Automatic Annotation of Very Large Corpora: a Study based on heterogeneous Tagging System",
"Borrowing Language Resources for Development of Automatic Speech Recognition for Low- and Middle-Density Languages",
"Evaluating Complement-Modifier Distinctions in a Semantically Annotated Corpus",
"Annotating Subjective Content in Meetings",
"Inter-sentential Coreferences in Semantic Networks: An Evaluation of Manual Annotation",
"Semantic Press",
"An eRulemaking Corpus: Identifying Substantive Issues in Public Comments",
"Tools & Resources for Visualising Conversational-Speech Interaction",
"A Bootstrapping Method for Building Subjectivity Lexicons for Languages with Scarce Resources",
"An Approach to Modeling Heterogeneous Resources for Information Extraction",
"Diacritic Annotation in the Arabic Treebank and its Impact on Parser Evaluation",
"On the Durational Reduction of Repeated Mentions: Recency and Speaker Effects",
"Finding the Sources and Targets of Subjective Expressions",
"Resources for Persuasion",
"Evaluation of Virtual Keyboards for West-African Languages",
"Annotation of WordNet Verbs with TimeML Event Classes",
"Anaphora Resolution Exercise: an Overview",
"Romanian Semantic Role Resource",
"Generating a Morphological Lexicon of Organization Entity Names",
"Using Similarity Metrics For Terminology Recognition",
"Minding the Source: Automatic Tagging of Reported Speech in Newspaper Articles",
"Valentino: A Tool for Valence Shifting of Natural Language Texts",
"Knowledge Sources for Bridging Resolution in Multi-Party Dialog",
"Let&#146;s not Argue about Semantics",
"Relation between Agreement Measures on Human Labeling and Machine Learning Performance: Results from an Art History Domain",
"ProPOSEL: A Prosody and POS English Lexicon for Language Engineering",
"Linguistic Structure and Bilingual Informants Help Induce Machine Translation of Lesser-Resourced Languages",
"Dependency-Based Relation Mining for Biomedical Literature",
"memasysco: XML schema based metadata management system for speech corpora",
"Chinese Term Extraction Based on Delimiters",
"On Classifying Coherent/Incoherent Romanian Short Texts",
"Improving Statistical Machine Translation Efficiency by Triangulation",
"A Linguistic Resource for Discovering Event Structures and Resolving Event Coreference",
"NineOneOne: Recognizing and Classifying Speech for Handling Minority Language Emergency Calls",
"Sentiment Analysis Based on Probabilistic Models Using Inter-Sentence Information",
"Automatic Rewriting of Patient Record Narratives",
"Converting Romanized Persian to the Arabic Writing Systems",
"Treebank-Based Acquisition of LFG Parsing Resources for French",
"What&#146;s in a Colour? Studying and Contrasting Colours with COMPARA",
"Production in a Multimodal Corpus: how Speakers Communicate Complex Actions",
"Methodologies for Designing and Recording Speech Databases for Corpus Based Synthesis",
"Linguistic Description and Automatic Extraction of Definitions from German Court Decisions",
"Characterization of Scientific and Popular Science Discourse in French, Japanese and Russian",
"Czech MWE Database",
"The ATIS Sign Language Corpus",
"A Comparison of Various Methods for Concept Tagging for Spoken Language Understanding",
"Comparing Set-Covering Strategies for Optimal Corpus Design",
"Management of Large Annotation Projects Involving Multiple Human Judges: a Case Study of GALE Machine Translation Post-editing",
"The Penn Discourse TreeBank 2.0.",
"The Linguistic Data Consortium Member Survey: Purpose, Execution and Results",
"Combining Terminology Resources and Statistical Methods for Entity Recognition: an Evaluation",
"Personae: a Corpus for Author and Personality Prediction from Text",
"In Contrast - A Complex Discourse Connective",
"Portuguese-English Word Alignment: some Experiments",
"A Corpus for Cross-Document Co-reference",
"Unsupervised Acquisition of Verb Subcategorization Frames from Shallow-Parsed Corpora",
"System Evaluation on a Named Entity Corpus from Clinical Notes",
"Knowledge-based Coreference Resolution for Hungarian",
"Navigating through Dense Annotation Spaces",
"Using Movie Subtitles for Creating a Large-Scale Bilingual Corpora",
"A Framework for Standardized Syntactic Annotation",
"Creating and Using a Correlated Corpus to Glean Communicative Commonalities",
"New Resources for Document Classification, Analysis and Translation Technologies",
"Extracting and Querying Relations in Scientific Papers on Language Technology",
"Parser Evaluation and the BNC: Evaluating 4 constituency parsers with 3 metrics",
"Annotation Tool Development for Large-Scale Corpus Creation Projects at the Linguistic Data Consortium",
"Experiments on Processing Overlapping Parallel Corpora",
"An AI-inspired intelligent agent/student architecture to combine Language Resources research and teaching",
"Creating Sentence-Aligned Parallel Text Corpora from a Large Archive of Potential Parallel Text using BITS and Champollion",
"A Multilingual Database of Polarity Items",
"Application of Resource-based Machine Translation to Real Business Scenes",
"Creating Glossaries Using Pattern-Based and Machine Learning Techniques",
"The Construction and Evaluation of Word Space Models",
"Automatic Evaluation Measures for Statistical Machine Translation System Optimization",
"The Pronouncing Dictionary of Austrian German (AGPD) and the Austrian Phonetic Database (ADABA): Report on a large Phonetic Resources Database of the three Major Varieties of German",
"Strengthening the Estonian Language Technology",
"Annotation and analysis of overlapping speech in political interviews",
"Projecting Propbank Roles onto the CCGbank",
"Designing and Evaluating a Russian Tagset",
"Word-level Dependency-structure Annotation to Corpus of Spontaneous Japanese and its Application",
"Phrase-Based Machine Translation based on Simulated Annealing",
"Bridging the Gap between Linguists and Technology Developers: Large-Scale, Sociolinguistic Annotation for Dialect and Speaker Recognition",
"Evaluating and Extending the Coverage of HPSG Grammars: A Case Study for German",
"The Italian Particle &#147;ne&#148;: Corpus Construction and Analysis",
"Constructing Evaluation Corpora for Automated Clinical Named Entity Recognition",
"Can we Evaluate the Quality of Generated Text?",
"Induction of Treebank-Aligned Lexical Resources",
"What is poorly Said is a Little Funny",
"A General Methodology for Mapping EuroWordNets to the Suggested Upper Merged Ontology",
"Tagging a Hebrew Corpus: the Case of Participles",
"Collection and Preprocessing of Czech Sign Language Corpus for Sign Language Recognition",
"An Infrastructure, Tools and Methodology for Evaluation of Multicultural Name Matching Systems",
"German Today: a really extensive Corpus of Spoken Standard German",
"Enhancing the Arabic Treebank: a Collaborative Effort toward New Annotation Guidelines",
"A Common Ground for Virtual Humans: Using an Ontology in a Natural Language Oriented Virtual Human Architecture",
"Lexicon Schemas and Related Data Models: when Standards Meet Users",
"Annotating Topics of Opinions",
"Answering List Questions using Co-occurrence and Clustering",
"A Comparative Cross-Domain Study of the Occurrence of Laughter in Meeting and Seminar Corpora",
"Building a Multilingual Lexical Resource for Named Entity Disambiguation, Translation and Transliteration",
"GMT to +2 or how can TimeML be used in Romanian",
"Modelling Word Similarity: an Evaluation of Automatic Synonymy Extraction Algorithms.",
"Information Extraction Tools and Methods for Understanding Dialogue in a Companion",
"A Development Environment for Configurable Meta-Annotators in a Pipelined NLP Architecture",
"Lexicon, Grammar, and Multilinguality in the Japanese FrameNet",
"Translation-oriented Word Sense Induction Based on Parallel Corpora",
"Using Similarity Measures to Extend the LinGO Lexicon",
"An Evaluation of Spoken and Textual Interaction in the RITEL Interactive Question Answering System",
"Smarty - Extendable Framework for Bilingual and Multilingual Comprehension Assistants",
"Low-Density Language Bootstrapping: the Case of Tajiki Persian",
"Pragmatic Annotation of Discourse Markers in a Multilingual Parallel Corpus (Arabic- Spanish-English)",
"Mapping Roget&#146;s Thesaurus and WordNet to French",
"A Method for Automatically Constructing Case Frames for English",
"Assessing the Costs of Machine-Assisted Corpus Annotation through a User Study",
"Corpus and Voices for Catalan Speech Synthesis",
"Unsupervised Learning-based Anomalous Arabic Text Detection",
"Identification of Naturally Occurring Numerical Expressions in Arabic",
"MTriage: Web-enabled Software for the Creation, Machine Translation, and Annotation of Smart Documents",
"Hungarian Word-Sense Disambiguated Corpus",
"Bootstrapping Language Description: the case of Mpiemo (Bantu A, Central African Republic)",
"Semantic Annotation Layer in Russian National Corpus: Lexical Classes of Nouns and Adjectives",
"A Conceptual Approach to Web Image Retrieval",
"A Unified Database of Dependency Treebanks: Integrating, Quantifying & Evaluating Dependency Data",
"Developments of &#147;L&#235tzebuergesch&#148; Resources for Automatic Speech Processing and Linguistic Studies",
"Training and Evaluation of POS Taggers on the French MULTITAG Corpus",
"Parallel Creation of Gigaword Corpora for Medium Density Languages - an Interim Report",
"Construction and Analysis of Word-level Time-aligned Simultaneous Interpretation Corpus",
"15 Years of Language Resource Creation and Sharing: a Progress Report on LDC Activities",
"Authorship Identification of Romanian Texts with Controversial Paternity",
"IrcamCorpusTools: an Extensible Platform for Spoken Corpora Exploitation",
"A Taxonomy of Lexical Metadata Categories",
"An Unsupervised Probabilistic Approach for the Detection of Outliers in Corpora",
"Acquiring a Poor Man&#146;s Inflectional Lexicon for German",
"ANNALIST - ANNotation ALIgnment and Scoring Tool",
"Evolutionary Basic Notions for a Thematic Representation of General Knowledge",
"Building an Annotated Corpus for Text Summarization and Question Answering",
"ODL: an Object Description Language for Lexical Information",
"Annotating Students&#146; Understanding of Science Concepts",
"Linguistic Resources for Reconstructing Spontaneous Speech Text",
"A Hybrid Morphology-Based POS Tagger for Persian",
"Annotating &#147;tense&#148; in a Tense-less Language",
"Causal Relation Extraction",
"A Pilot Arabic Propbank",
"Spock - a Spoken Corpus Client",
"Automated Subject Induction from Query Keywords through Wikipedia Categories and Subject Headings",
"Multimodal Spontaneous Expressive Speech Corpus for Hungarian",
"A Lightweight and Efficient Tool for Cleaning Web Pages",
"Low-Complexity Heuristics for Deriving Fine-Grained Classes of Named Entities from Web Textual Data",
"Exploitation of an Arabic Language Resource for Machine Translation Evaluation: using Buckwalter-based Lookup Tool to Augment CMU Alignment Algorithm",
"Head or Non-head? Semi-automatic Procedures for Extracting and Classifying Subcategorisation Properties of Compounds.",
"Using the Complexity of the Distribution of Lexical Elements as a Feature in Authorship Attribution",
"Estimating the Resource Adaption Cost from a Resource Rich Language to a Similar Resource Poor Language",
"Evaluation of Context-Dependent Phrasal Translation Lexicons for Statistical Machine Translation",
"A Guide for the Production of Reusable Language Resources",
"Latest Developments in ELRA&#146;s Services",
"The JOS Morphosyntactically Tagged Corpus of Slovene",
"An Evaluation Resource for Geographic Information Retrieval",
"An Experimental Methodology for an End-to-End Evaluation in Speech-to-Speech Translation",
"New Telephone Speech Databases for French: a Children Database and an optimized Adult Corpus",
"Speaker Recognition: Building the Mixer 4 and 5 Corpora",
"More Semantic Links in the SIMPLE-CLIPS Database",
"KnoFusius: a New Knowledge Fusion System for Interpretation of Gene Expression Data",
"The INFILE Project: a Crosslingual Filtering Systems Evaluation Campaign",
"PASSAGE: from French Parser Evaluation to Large Sized Treebank",
"Annotation of Nuggets and Relevance in GALE Distillation Evaluation",
"RACAI&#146;s Linguistic Web Services",
"Linguistically Light Lexical Extensions for Ontologies",
"Amazigh Language Terminology in Morocco or Management of a &#147;Multidimensional&#148; Variation",
"From Research to Application in Multilingual Information Access: the Contribution of Evaluation",
"Statistical Evaluation of Information Distillation Systems",
"Quick Rich Transcriptions of Arabic Broadcast News Speech Data",
"MEDAR: Collaboration between European and Mediterranean Arabic Partners to Support the Development of Language Technology for Arabic",
"Prolexbase: a Multilingual Relational Lexical Database of Proper Names",
"Words in Contexts: Digital Editions of Literary Journals in the &#147;AAC - Austrian Academy Corpus&#148;",
"Towards Formal Interpretation of Semantic Annotation",
"Towards a Reference Corpus of Web Genres for the Evaluation of Genre Identification Systems",
"An Exchange Format for Multimodal Annotations",
"A Research on Automatic Chinese Catchword Extraction",
"The Metadata-Database of a Next Generation Sustainability Web-Platform for Language Resources",
"Performance Evaluation of Speech Translation Systems"];
var doc_text=[
"This paper describes an attempt to use the information contained in VerbNet to obtain change of location inferences. We show that the information is a...",
"This paper describes a new speech corpus, STC-TIMIT, and discusses the process of design, development and its distribution through LDC. The STC-TIMIT ...",
"We report on the evaluation of the Norwegian-English MT prototype system LOGON. The system is rule-based and makes use of well-established frameworks ...",
"We introduce the corpus of United States Congressional bills from 1947 to 1998 for use by language research communities. The U.S. Policy Agenda Legisl...",
"SpatialML is an annotation scheme for marking up references to places in natural language. It covers both named and nominal references to places, grou...",
"As a first step to developing systems that enable non-native speakers to output near-perfect English sentences for given mixed English-Japanese senten...",
"In this paper, we discuss the integration of metaphor information into the RDF/OWL representation of EuroWordNet. First, the lexical database WordNet ...",
"The orthographical complexities of Chinese, Japanese, Korean (CJK) and Arabic pose a special challenge to developers of NLP applications. These diffic...",
"Applications of statistical Arabic NLP in general, and text mining in specific, along with the tools underneath perform much better as the statistical...",
"On many examples we present a query language of Netgraph - a fully graphical tool for searching in the Prague Dependency Treebank 2.0. To demonstrate ...",
"News articles about the same event published over time have properties that challenge NLP and IR applications. A cluster of such texts typically exhib...",
"In this paper we describe the METIS-II system and its evaluation on each of the language pairs: Dutch, German, Greek, and Spanish to English. The METI...",
"WCTAnalyze is a tool for storing, accessing and visually analyzing huge collections of temporally indexed data. It is motivated by applications in med...",
"In dialogue systems, it is necessary to decode the user input into semantically meaningful units. These semantical units, usually Dialogue Acts (DA), ...",
"This paper investigates the state of the art in automatic textual annotation tools, and examines the extent to which they are ready for use in the rea...",
"Modern statistical parsers are trained on large annotated corpora (treebanks). These treebanks usually consist of sentences addressing different subdo...",
"In this paper, we describe our work on building a parallel treebank for a less studied and typologically dissimilar language pair, namely Swedish and ...",
"We propose in this paper an automatic evaluation procedure based on a metric which could provide summary evaluation without human assistance. Our syst...",
"We address the question of which syntactic representation is best suited for role-semantic analysis of English in the FrameNet paradigm. We compare sy...",
"A wide spectrum of multilingual applications have aligned parallel corpora as their prerequisite. The aim of the project described in this paper is to...",
"Large repositories of life science data in the form of domain-specific literature and large specialised textual collections increase on a daily basis ...",
"Automatic sentiment analysis in texts has attracted considerable attention in recent years. Most of the approaches developed to classify texts or sent...",
"Research into spoken language has become more visual over the years. Both fundamental and applied research have progressively included gestures, gaze,...",
"We present a multi-lingual dictionary of dirty words. We have collected about 3,200 dirty words in several languages and built a database of these. Th...",
"We present a corpus of spoken dialogues between students and an adaptive Wizard-of-Oz tutoring system, in which student uncertainty was manually annot...",
"For a language pair such as Chinese and Korean that belong to entirely different language families in terms of typology and genealogy, finding the cor...",
"We present an approach for querying collections of heterogeneous linguistic corpora that are annotated on multiple layers using arbitrary XML-based ma...",
"This paper outlines the new resource technologies, products and applications that have been constructed during the development of a multi-modal (MM he...",
"This paper presents LexSchem - the first large, fully automatically acquired subcategorization lexicon for French verbs. The lexicon includes subcateg...",
"Several studies indicate that the level of predicate-argument structure is relevant for modeling prevalent phenomena in current textual entailment cor...",
"The availability of a huge mass of textual data in electronic format has increased the need for fast and accurate techniques for textual data processi...",
"This paper focuses on automatically improving the readability of documents. We explore mechanisms relating to content control that could be used (i) b...",
"This paper explores how a battery of unsupervised techniques can be used in order to create large, high-quality corpora for textual inference applicat...",
"This paper describes Eksairesis, a system for learning economic domain knowledge automatically from Modern Greek text. The knowledge is in the form of...",
"This paper reports on the creation of the multimodal NIMITEK corpus of affected behavior in human-machine interaction and its role in the development ...",
"Tokenization is one of the initial steps done for almost any text processing task. It is not particularly recognized as a challenging task for English...",
"In this paper, we investigate the use of a machine-learning based approach to the specific problem of scientific term detection in patient information...",
"Language models used in current automatic speech recognition systems are trained on general-purpose corpora and are therefore not relevant to transcri...",
"Language resources and tools to create and process these resources are necessary components in human language technology and natural language applicat...",
"We develop a method for detecting errors in semantic predicate-argument annotation, based on the variation n-gram error detection method. After establ...",
"This paper introduces Saxon, a rule-based document annotator that is capable of processing and annotating several document formats and media, both wit...",
"We describe a web-based corpus query system, Glossa, which combines the expressiveness of regular query languages with the user-friendliness of a grap...",
"With the information overload in the life sciences there is an increasing need for annotated corpora, particularly with biological and biomedical enti...",
"We outline a methodological classification for evaluation approaches of software in general. This classification was initiated partly owing to involve...",
"Recently, most of the research in NLP has concentrated on the creation of applications coping with textual entailment. However, there still exist very...",
"Cleaneval is a shared task and competitive evaluation on the topic of cleaning arbitrary web pages, with the goal of preparing web data for use as a c...",
"We describe the process of converting plain text cultural heritage data to elements of a domain-specific knowledge base, using general machine learnin...",
"Even though a wealth of speech data is available for the dialog systems research community, the particular field of situated language has yet to find ...",
"This paper describes a method of readability measurement of Japanese texts based on a newly compiled textbook corpus. The textbook corpus consists of ...",
"We describe ParsCit, a freely available, open-source implementation of a reference string parsing package. At the core of ParsCit is a trained conditi...",
"This paper deals with non manual gestures annotation involved in Sign Language within the context of automatic generation of Sign Language. We will ta...",
"Recently, language resources (LRs) are becoming indispensable for linguistic research. Unfortunately, it is not easy to find their usages by searching...",
"This paper describes the use of the CasSys platform in order to achieve the chunking of conversational speech transcripts by means of cascades of Unit...",
"In this paper, we present a simple yet efficient automatic system to translate biomedical terms. It mainly relies on a machine learning approach able ...",
"Texts generated by automatic speech recognition (ASR) systems have some specificities, related to the idiosyncrasies of oral productions or the princi...",
"This paper proposes a method of constructing a dictionary for a pair of languages from bilingual dictionaries between each of the languages and a thir...",
"The PARC 700 dependency bank has a number of features that would seem to make it less than optimally suited for its intended purpose, parser evaluatio...",
"One problem of data-driven answer extraction in open-domain factoid question answering is that the class distribution of labeled training data is fair...",
"Semantic roles have often proved to be useful labels for stating linguistic generalisations of various sorts. There is, however, a lack of agreement o...",
"The goal of this paper is to describe how adjectives are encoded in Cornetto, a semantic lexical database for Dutch. Cornetto combines two existing le...",
"Morphological query expansion and language-filtering words have proved to be valid methods when searching the web for content in Basque via APIs of co...",
"The paper presents a tool assisting manual annotation of linguistic data developed at the Department of Computational linguistics, IBL-BAS. Chooser is...",
"In this paper, we present the collection and analysis of a spoken dialogue corpus obtained from interactions of older and younger users with a smart-h...",
"This paper presents the automatic extension of Princeton WordNet with Named Entities (NEs). This new resource is called Named Entity WordNet. Our meth...",
"Computational terminology has notably evolved since the advent of computers. Regarding the extraction of terms in particular, a large number of resour...",
"Times have changed over the last ten years in terms of dictionary production. With the introduction of digital support and networking, the lifespan of...",
"The Berkeley FrameNet Project (BFN) is making an English lexical database called FrameNet, which describes syntactic and semantic properties of an Eng...",
"Discovering relations among Named Entities (NEs) from large corpora is both a challenging, as well as useful task in the domain of Natural Language Pr...",
"Most of the Web-based methods for lexicon augmenting consist in capturing global semantic features of the targeted domain in order to collect relevant...",
"In this paper, we present a comparison between two corpora acquired by means of two different techniques. The first corpus was acquired by means of th...",
"We show here the viability of a rapid deployment of a new language pair within the METIS architecture. In order to do it, we have benefited from the a...",
"Developing linguistic resources, in particular grammars, is known to be a complex task in itself, because of (amongst others) redundancy and consisten...",
"In this paper, we present an original framework to model frame semantic resources (namely, FrameNet) using minimal supervision. This framework can be ...",
"In this paper we present two large-scale verbal lexicons, AnCora-Verb-Ca for Catalan and AnCora-Verb-Es for Spanish, which are the basis for the seman...",
"In this paper, we describe a unifying approach to tackle data heterogeneity issues for lexica and related resources. We present LEXUS, our software th...",
"The &#147;download first, then process paradigm&#148; is still the predominant working method amongst the research community. The web-based paradigm, ...",
"We present the procedures we implemented to carry out system oriented evaluation of a syntax-based word aligner, ALIBI. While cross-corpus evaluation ...",
"The Data Category Registry is one of the ISO initiatives towards the establishment of standards for Language Resource management, creation and coding....",
"This paper presents ongoing work dedicated to parsing the textual structure of procedural texts. We propose here a model for the intructional structur...",
"Based on the idea that local contexts predict the same basic category across a language, we develop a simple method for comparing tagsets across corpo...",
"This paper presents a new corpus project, aiming at building a national corpus of Polish. What makes it different from a typical YACP (Yet Another Cor...",
"The paper presents Spejd, an Open Source Shallow Parsing and Disambiguation Engine. Spejd (abbreviated to &#9824;) is based on a fully uniform formali...",
"The paper deals with the task of definition extraction from a small and noisy corpus of instructive texts. Three approaches are presented: Partial Par...",
"Combinatorial Category Grammar is (CCG) a lexicalized grammar formalism which is expressed by syntactic category, a logical form representation. There...",
"The high level of heterogeneity between linguistic annotations usually complicates the interoperability of processing modules within an NLP pipeline. ...",
"GermaNet is regarded to be a valuable resource for many German NLP applications, corpus research, and teaching. This demo presents three GUI-based too...",
"Multilingual Automatic Speech Recognition (ASR) systems are of great interest in multilingual environments. We studied the case of the Comunitat Valen...",
"We have integrated the RASP system with the UIMA framework (RASP4UIMA) and used this to parse the XML-encoded version of the British National Corpus (...",
"The Semantic Web of the future will be characterized by using a very large number of ontologies embedded in ontology networks. It is important to prov...",
"Named Entities (NE) are regarded as an important type of semantic knowledge in many natural language processing (NLP) applications. Originally, a limi...",
"This paper presents an algorithm for correcting language errors typical of second-language learners. We focus on preposition errors, which are very co...",
"Although ontologies and linguistic resources play a key role in applied AI and NLP, they have not been developed in a common and systematic way. The l...",
"To achieve true interoperability for valuable linguistic resources different levels of variation need to be addressed. ISO Technical Committee 37, Ter...",
"In this paper we briefly describe the BioSec multimodal biometric database and analyze its use in automatic text-dependent speaker recognition researc...",
"This paper presents a context sensitive spell checking system that uses mixed trigram models, and introduces a new empirically grounded method for bui...",
"The production of rich multilingual speech corpus resources on a large scale is a requirement for many linguistic, phonetic and technological tasks, i...",
"While recent corpus annotation efforts cover a wide variety of semantic structures, work on temporal and causal relations is still in its early stages...",
"Manual categorisation of documents is a time-consuming task that has been significantly alleviated with the deployment of automatic and machine-aided ...",
"This paper discusses ontologization of lexicon access functions in the context of a service-oriented language infrastructure, such as the Language Gri...",
"This paper describes a three-part annotation scheme for superlatives. The first identifies syntactic classes, since superlatives can serve different s...",
"Generally, ontology learning and population is applied as a semi-automatic approach to knowledge acquisition in natural language understanding systems...",
"The Framework for the Evaluation for Machine Translation (FEMTI) contains guidelines for building a quality model that is used to evaluate MT systems ...",
"In this paper we present a corpus of interactions of older and younger users with nine different dialogue systems. The corpus has been fully transcrib...",
"We have obtained the valuable findings about the developmental processes of demonstrative expression skills, which is concerned with the fundamental c...",
"Krahmer et al.&#146;s (2003) graph-based framework provides an elegant and flexible approach to the generation of referring expressions. In this paper...",
"Web count statistics gathered from search engines have been widely used as a resource in a variety of NLP tasks. For some tasks, however, the informat...",
"This paper presents a freely-available, and flexible Wizard of Oz environment for rapid prototyping. The system is designed to investigate the require...",
"Developing a full coreference system able to run all the way from raw text to semantic interpretation is a considerable engineering effort. Accordingl...",
"This paper presents the sequential evaluation of the question answering system SQuaLIA. This system is based on the same sequential process as most st...",
"When a user cannot find a word, he may think of semantically related words that could be used into an automatic process to help him. This paper presen...",
"This paper deals with the treatment of constructed neologisms in a machine translation system. It focuses on a particular issue in Romance languages: ...",
"In this paper we present two experiments conducted for comparison of different language identification algorithms. Short words-, frequent words- and n...",
"Question Answering systems are systems that enable the user to ask questions in natural language and to also receive an answer in natural language. Mo...",
"This paper reports an experience on producing manual word alignments over six different language pairs (all combinations between Portuguese, English, ...",
"Part-of-Speech tagging is generally performed by Markov models, based on bigram or trigram models. While Markov models have a strong concentration on ...",
"Within the scope of the SPACE project, the CHildren&#146;s Oral REading Corpus (CHOREC) is developed. This database contains recorded, transcribed and...",
"Cornetto is a two-year Stevin project (project number STE05039) in which a lexical semantic database is built that combines Wordnet with Framenet-like...",
"This paper introduces a knowledge representation formalism used for annotation of the French MEDIA dialogue corpus in terms of high level semantic str...",
"In this paper, we discuss lemma identification in Japanese morphological analysis, which is crucial for a proper formulation of morphological analysis...",
"Parallel corpora are critical resources for machine translation research and development since parallel corpora contain translation equivalences of va...",
"The paper describes the treatment of some specific syntactic constructions in two treebanks of Latin according to a common set of annotation guideline...",
"OntoSelect is a dynamic web-based ontology library that harvests, analyzes and organizes ontologies published on the Semantic Web. OntoSelect allows s...",
"Detecting the tone or emotive content of a text message is increasingly important in many natural language processing applications. While for the Engl...",
"Structural metadata extraction (MDE) research aims to develop techniques for automatic conversion of raw speech recognition output to forms that are m...",
"In the field of ontology mapping, multilingual ontology mapping is an issue that is not well explored. This paper proposes a framework for mapping of ...",
"Terms, term relevances, and sentence relevances are concepts that figure in many NLP applications, such as Text Summarization. These concepts are impl...",
"In this paper, we discuss methods of measuring the performance of ontology-based information extraction systems. We focus particularly on the Balanced...",
"Basque is a highly inflected and agglutinative language (Alegria et al., 1996). Two-level morphology has been applied successfully to this kind of lan...",
"In this paper we analyse data from the SemEval lexical substitution task in those cases where the annotators indicated that the target word was part o...",
"The field of automated sentiment analysis has emerged in recent years as an exciting challenge to the computational linguistics community. Research in...",
"Our paper focuses on the gain which can be achieved on human transcription of spontaneous and prepared speech, by using the assistance of an ASR syste...",
"The goal of the LILA project was the collection of speech databases over cellular telephone networks of five languages in three Asian countries. Three...",
"In this paper the dialogue act annotation of naive and expert annotators, both annotating the same data, are compared in order to characterise the ins...",
"We present in this article the methods we used for obtaining measures to ensure the quality and well-formedness of a text corpus. These measures allow...",
"The paper presents a set of approaches to extend the automatically created Slovene wordnet with nominal multi-word expressions. In the first approach ...",
"In this paper we present our recent work to develop phonemic and syllabic inventories for Castilian Spanish based on the C-ORAL-ROM corpus, a spontane...",
"The research field of &#147;extracting knowledge bases from text collections&#148; seems to be mature: its target and its working hypotheses are clear...",
"Based on simple methods such as observing word and part of speech tag co-occurrence and clustering, we generate syntactic parses of sentences in an en...",
"A new, linguistically annotated, video database for automatic sign language recognition is presented. The new RWTH-BOSTON-400 corpus, which consists o...",
"Many of the beliefs that one uses to reason about everyday entities and events are neither strictly true or even logically consistent. Rather, people ...",
"Embodied Conversational Agents have typically been constructed for use in limited domain applications, and tested in very specialized environments. On...",
"The purpose of Oriental COCOSDA is to provide the Asian community a platform to exchange ideas, to share information and to discuss regional matters o...",
"In our paper we present a methodology used for low-cost validation of quality of Part-of-Speech annotation of the Prague Dependency Treebank based on ...",
"This paper describes the development of a ground truth dataset of culturally diverse Romanized names in which approximately 70,000 names are matched a...",
"We describe a set of experiments to explore statistical techniques for ranking and selecting the best translations in a graph of translation hypothese...",
"This paper presents MISTRAL, an open source statistical machine translation decoder dedicated to spoken language translation. While typical machine tr...",
"We present an experiment in extracting collocations from the FrameNet corpus, specifically, support verbs such as direct in Environmentalists directed...",
"This paper describes an accurate, extensible method for automatically classifying unknown foreign words that requires minimal monolingual resources an...",
"This paper presents a series of tools for the extraction of specialized corpora from the web and its subsequent analysis mainly with statistical techn...",
"Arrau is a new corpus annotated for anaphoric relations, with information about agreement and explicit representation of multiple antecedents for ambi...",
"Evaluation of Machine Translation (MT) technology is often tied to the requirement for tedious manual judgments of translation quality. While automate...",
"This paper describes the open source SemanticVectors package that efficiently creates semantic vectors for words and documents from a corpus of free t...",
"In this paper, we describe a system that divides example sentences (data set) into clusters, based on the meaning of the target word, using a semi-sup...",
"This paper focuses on the influence of changing the text time frame on the performance of a named entity tagger. We followed a twofold approach to inv...",
"This paper describes CzEng 0.7, a new release of Czech-English parallel corpus freely available for research and educational purposes. We provide basi...",
"We present an approach to the discovery of semantically similar terms that utilizes a web search engine as both a source for generating related terms ...",
"Data Selection has emerged as a common issue in language technologies. We define Data Selection as the choosing of a subset of training data that is m...",
"We present a study of the word interaction networks of Bengali in the framework of complex networks. The topological properties of these networks reve...",
"The Teko corpus composing model offers a decentralized, dynamic way of collecting high-quality text corpora for linguistic research. The resulting cor...",
"This paper describes Babylon, a system that attempts to overcome the shortage of parallel texts in low-density languages by supplementing existing par...",
"Verb lexical semantic properties are only one of the factors that contribute to the determination of the event type expressed by a sentence, which is ...",
"In this paper we discuss the design, acquisition and preprocessing of a Czech audio-visual speech corpus. The corpus is intended for training and test...",
"The paper provides a general introduction to the CLARIN project, a large-scale European research infrastructure project designed to establish an integ...",
"Large speech and text corpora are crucial to the development of a state-of-the-art speech recognition system. This paper reports on the construction a...",
"WordNet has been used extensively as a resource for the Word Sense Disambiguation (WSD) task, both as a sense inventory and a repository of semantic r...",
"The modelling of realistic emotional behaviour is needed for various applications in multimodal human-machine interaction such as the design of emotio...",
"We present and partially evaluate procedures for the extraction of noun+verb collocation candidates from German text corpora, along with their morphos...",
"The huge amount of the available information in the Web creates the need of effective information extraction systems that are able to produce metadata...",
"The paper provides an overview of the Polish Speech Database for taking dictation of legal texts, created for the purpose of LVCSR system for Polish. ...",
"This paper describes a corpus consisting of audio data for automatic space monitoring based solely on the perceived acoustic information. The particul...",
"Text condensation aims at shortening the length of an utterance without losing essential textual information. In this paper, we report on the implemen...",
"The paper deals with the process of designing a phonetically and prosodically rich speech corpus for unit selection speech synthesis. The attention is...",
"The consortium ECESS (European Center of Excellence for Speech Synthesis) has set up a framework for evaluation of software modules and tools relevant...",
"In the context of the CATCH research program that is currently carried out at a number of large Dutch cultural heritage institutions our ambition is t...",
"Research activity on the Portuguese language for speech synthesis and recognition has suffered from a considerable lack of human and material resource...",
"This paper addresses a specific case of the task of lexical acquisition understood as the induction of information about the linguistic characteristic...",
"Active learning (AL) is getting more and more popular as a methodology to considerably reduce the annotation effort when building training material fo...",
"The goal of this work is to introduce an architecture to automatically detect the amount of stress in the speech signal close to real time. For this a...",
"We present a universal Parts-of-Speech (POS) tagset framework covering most of the Indian languages (ILs) following the hierarchical and decomposable ...",
"We report on an on-going research project aimed at increasing the range of translation equivalents which can be automatically discovered by MT systems...",
"We describe and evaluate a prototype system for recognising person and place names in digitised records of British parliamentary proceedings from the ...",
"This paper describes an ongoing project in which we are collecting a learner corpus of Arabic, developing a tagset for error annotation and performing...",
"In this paper, we present a database with speech in different types of background noises. The speech and noise were recorded with a set of different m...",
"Automatic tagging in Spanish has historically faced many problems because of some specific grammatical constructions. One of these traditional pitfall...",
"In this paper we present a new Document Management System called DrStorage. This DMS is multi-platform, JCR-170 compliant, supports WebDav, versioning...",
"In the context of ontology-based information extraction, identity resolution is the process of deciding whether an instance extracted from text refers...",
"Some alternatives to the standard evalb measures for parser evaluation are considered, principally the use of a tree-distance measure, which assigns a...",
"Large-scale grammar-based parsing systems nowadays increasingly rely on independently developed, more specialized components for pre-processing their ...",
"This paper presents the results of a graph-based method for performing knowledge-based Word Sense Disambiguation (WSD). The technique exploits the str...",
"Hardly any other kind of text structures is as notoriously difficult to read as patents. This is first of all due to their abstract vocabulary and the...",
"Treatment of Multiword Expressions (MWEs) is one of the most complicated issues in natural language processing, especially in Machine Translation (MT)...",
"Development of lexical resources is, along with grammar development, one of the main efforts when building multilingual NLP applications. In this pape...",
"LC-STAR II is a follow-up project of the EU funded project LC-STAR (Lexica and Corpora for Speech-to-Speech Translation Components, IST-2001-32216). L...",
"This paper describes the corpus of university lectures that has been recorded in European Portuguese, and some of the recognition experiments we have ...",
"This paper presents AnCora, a multilingual corpus annotated at different linguistic levels consisting of 500,000 words in Catalan (AnCora-Ca) and in S...",
"Morphologically rich languages pose a challenge to the annotators of treebanks with respect to the status of orthographic (space-delimited) words in t...",
"In this paper we present a Japanese-English Bilingual lexicon of technical terms. The lexicon was derived from the first and second NTCIR evaluation c...",
"Within the CLARIN e-science infrastructure project it is foreseen to develop a component-based registry for metadata for Language Resources and Langua...",
"The computational linguistics community in The Netherlands and Belgium has long recognized the dire need for a major reference corpus of written Dutch...",
"Within the framework of the Dutch-Flemish programme STEVIN, the JASMIN-CGN (Jongeren, Anderstaligen en Senioren in Mens-machine Interactie&#146; Corpu...",
"We report the results of a study that investigates the agreement of anaphoric annotations. The study focuses on the influence of the factors text leng...",
"The DAM-LR project aims at virtually integrating various European language resource archives that allow users to navigate and operate in a single unif...",
"We outline work performed within the framework of a current EC project. The goal is to construct a language-independent information system for a speci...",
"This paper is motivated by the demand for more linguistic resources for the study of languages and the improvement of those already existing. The firs...",
"About two years ago, the Max Planck Institute for Psycholinguistics in Nijmegen, The Netherlands, started an initiative to install regional language a...",
"We propose two general and robust methods for enriching resources annotated in the Frame Semantic paradigm with syntactic dependency graphs, which can...",
"Terminology extraction commonly includes two steps: identification of term-like units in the texts, mostly multi-word phrases, and the ranking of the ...",
"The Internet has become the most popular platform for communication. However because most of the modern computer keyboard is Latin-based, Asian langua...",
"The emerging area of Geographic Information Systems (GIS) has proven to add an interesting dimension to many research projects. Within the language-si...",
"We present a tool, BLEU+, which implements various extension to BLEU computation to allow for a better understanding of the translation performance, e...",
"We have performed a set of experiments made to investigate the utility of morphological analysis to improve retrieval of documents written in language...",
"This paper describes the creation of a state-of-the-art answer type detection system capable of recognizing more than 200 different expected answer ty...",
"This paper shows how a research and industry stimulation programme on human language technologies (HLT) for Dutch can be &#147;enhanced&#148; with mor...",
"We address here the need to assist users in rapidly accessing the most important or strategic information in the text corpus by identifying sentences ...",
"This paper presents a multipurpose system for wordnet (WN) development, named Hydra. Hydra is an application for data editing and validation, as well ...",
"This paper proposes a ping-pong document clustering method using NMF and the linkage based refinement alternately, in order to improve the clustering ...",
"This paper presents the complete and consistent ontological annotation of the nominal part of WordNet. The annotation has been carried out using the s...",
"Princeton WordNet (WN.Pr) lexical database has motivated efficient compilations of bulky relational lexicons since its inception in the 1980´s. The Eu...",
"A new approach to handle unknown words in machine translation is presented. The basic idea is to find definitions for the unknown words on the source ...",
"In this paper we present the Cast3LB-CoNLL-SemRol corpus, currently the only corpus of Spanish annotated with dependency syntax and semantic roles, an...",
"This paper focuses on different aspects of collaborative work used to create the electronic version of a dictionary in paper format, edited and printe...",
"The project presented here is a part of a long term research program aiming at a full lexicon grammar for Polish (SyntLex). The main concern of this p...",
"The Spoken Language Communication and Translation System for Tactical Use (TRANSTAC) program is a Defense Advanced Research Agency (DARPA) program to ...",
"Some big languages like English are spoken by a lot of people whose mother tongues are different from. Their second languages often have not only dist...",
"The Spoken Document Processing Working Group, which is part of the special interest group of spoken language processing of the Information Processing ...",
"A frequent problem in automatic categorization applications involving Portuguese language is the absence of large corpora of previously classified doc...",
"A statistical machine translation (SMT) system requires homogeneous training data in order to get domain-sensitive (or context-sensitive) terminology ...",
"The purpose of this paper is to clarify the temporal aspect of terminology focusing on the dictionary&#146;s impact on terms. We used women&#146;s stu...",
"Many of the Japanese ideographs (Chinese characters) have a few meanings. Such ambiguities should be identified by using their contextual information....",
"In this paper we present an algorithm for automatic extraction of textual elements, namely titles and full text, associated with news stories in news ...",
"This paper discusses development and evaluation of a practical, valid and reliable instrument for evaluating the spoken language abilities of second-l...",
"What kinds of lexical resources are helpful for extracting useful information from domain-specific documents? Although domain-specific documents conta...",
"In this paper we describe the construction of an illustrated Japanese Wordnet. We bootstrap the Wordnet using existing multiple existing wordnets in o...",
"This paper presents the design and construction of a Chinese opinion corpus based on the online product reviews. Based on the observation on the chara...",
"Acquiring knowledge from the Web to build domain ontologies has become a common practice in the Ontological Engineering field. The vast amount of free...",
"A number of forensic studies published during the last 50 years report that intoxication with alcohol influences speech in a way that is made manifest...",
"Recently, collaboratively constructed resources such as Wikipedia and Wiktionary have been discovered as valuable lexical semantic knowledge bases wit...",
"Phonetic segmentation is the procedure which is used in many applications of speech processing, both as a subpart of automated systems or as the tool ...",
"Corpus-based approaches and statistical approaches have been the main stream of natural language processing research for the past two decades. Languag...",
"This paper proposes a method of increasing the size of a bilingual lexicon obtained from two other bilingual lexicons via a pivot language. When we ap...",
"The multilingual European Thesaurus on International Relations and Area Studies (European Thesaurus) is a special subject thesaurus for the field of i...",
"The IDEX system is a prototype of an interactive dynamic Information Extraction (IE) system. A user of the system expresses an information request in ...",
"The paper reports on completed work aimed at the creation of a resource, namely, the Greek Textual Entailment Corpus (GTEC) that is appropriate for gu...",
"The National Institute of Information and Communications Technology (NICT) and Nagoya University have been jointly constructing a large scale database...",
"Chinese writing system is not only used by Chinese but also used by Japanese. The motivation of this paper is to extend the architecture of Hantology ...",
"Despite of the importance of lexical resources for a number of NLP applications (Machine Translation, Information Extraction, Question Answering, amon...",
"We describe various syntactic and semantic conditions for finding abstractnouns which refer to concepts of adjectives from a text, in an attempt to ex...",
"This presentation focuses on the semi-automatic extension of Arabic WordNet (AWN) using lexical and morphological rules and applying Bayesian inferenc...",
"This paper presents a feasibility study of a merge between SprogTeknologisk Ordbase (STO), which contains morphological and syntactic information, and...",
"This paper describes the evaluation process of an emotional speech database recorded for standard Basque, in order to determine its adequacy for the a...",
"Open answers in questionnaires contain valuable information that is very time-consuming to analyze manually. We present a method for hypothesis genera...",
"The Dutch HLT agency for language and speech technology (known as TST-centrale) at the Institute for Dutch Lexicology is responsible for the maintenan...",
"This paper is a contribution to formal ontology study. Some entities belong more or less to a class. In particular, some individual entities are attac...",
"In this paper, we investigated how foreign language speakers pronounce Japanese words transliterated using two major Romanization systems, Hepburn and...",
"Many systems have been developed in the past few years to assist researchers in the discovery of knowledge published as English text, for example in t...",
"We describe recent work on MedSLT, a medium-vocabulary interlingua-based medical speech translation system, focussing on issues that arise when handli...",
"Statistical Machine Translation (SMT) is based on alignment models which learn from bilingual corpora the word correspondences between source and targ...",
"The ACL Anthology is a digital archive of conference and journal papers in natural language processing and computational linguistics. Its primary purp...",
"ASV Toolbox is a modular collection of tools for the exploration of written language data both for scientific and educational purposes. It includes mo...",
"In human face-to-face interaction, participants can rely on a number of audio-visual information for interpreting interlocutors&#146; communicative in...",
"The paper presents a project of the Laboratoire Parole & Langage which aims at collecting, annotating and exploiting a corpus of spoken French in a mu...",
"This paper presents our work on the detection of temporal information in web pages. The pages examined within the scope of this study were taken from ...",
"In this paper we describe the methodology and the first steps for the creation of WNTERM (from WordNet and Terminology), a specialized lexicon produce...",
"The aim of this paper is to present the design of a multimodal database suitable for research on new possibilities for automatic diagnosis of patients...",
"Large vocabulary automatic speech recognition (ASR) technologies perform well in known, controlled contexts. However recognition of proper nouns is co...",
"In aiming at research and development on machine translation, we produced a test collection for Japanese-English machine translation in the seventh NT...",
"The construction of a wordnet, a labour-intensive enterprise, can be significantly assisted by automatic grouping of lexical material and discovery of...",
"In this article we present a method for combining different information retrieval models in order to increase the retrieval performance in a Speech In...",
"In biomedical articles, terms with the same surface forms are often used to refer to different entities across a number of model organisms, in which c...",
"Speaker identification and verification systems have a poor performance when model training is done in one language while the testing is done in anoth...",
"This paper describes a novel methodology to perform bilingual terminology extraction, in which automatic alignment is used to improve the performance ...",
"An important problem when using Stochastic Inversion Transduction Grammars is their computational cost. More specifically, when dealing with corpora s...",
"Recently, speech recognition performance has been drastically improved by statistical methods and huge speech databases. Now performance improvement u...",
"This paper describes an ongoing project &#147;Japanese FrameNet (JFN)&#148;, a corpus-based lexicon of Japanese in the FrameNet style. This paper focu...",
"This paper presents some preliminary results of our dependency parser for Thai. It is part of an ongoing project in developing a syntactically annotat...",
"In the few last years, due to the increasing importance of the web, both computational tools and resources need to be more and more visible and easily...",
"In this paper, a large-scale real-world speech database is introduced along with other multimedia driving data. We designed a data collection vehicle ...",
"Distributional, corpus-based descriptions have frequently been applied to model aspects of word meaning. However, distributional models that use corpu...",
"We present the machine learning framework that we are developing, in order to support explorative search for non-trivial linguistic configurations in ...",
"Some time in the future, some spelling error correction system will correct all the errors, and only the errors. We need evaluation metrics that will ...",
"This paper describes the interaction among language resources for an adequate concept annotation of domain texts in several languages. The architectur...",
"This paper presents an approach to computer-assisted teaching of reading abilities using corpus data. The approach is supported by a set of tools for ...",
"We have analyzed the SPEX algorithm by Bernstein and Zobel (2004) for detecting co-derivative documents using duplicate n-grams. Although we totally a...",
"In this paper we propose a partial parsing model which achieves robust parsing with a large HPSG grammar. Constraint-based precision grammars, like th...",
"This work studies the viability of performing heterogeneous automatic MT error analyses. Error analysis is, undoubtly, one of the most crucial stages ...",
"This paper addresses the problem of synchronizing movie subtitles, which is necessary to improve alignment quality when building a parallel corpus out...",
"This paper describes the Norwegian broadcast news speech corpus RUNDKAST. The corpus contains recordings of approximately 77 hours of broadcast news s...",
"State-of-the-art coreference resolution engines show similar performance figures (low sixties on the MUC-7 data). Our system with a rich linguisticall...",
"In the Autonomata project we have collected a corpus of spoken name utterances with manually corrected phonemic transcriptions of these utterances. Th...",
"In this paper we propose a rule-based approach to extract dependency and grammatical functions from the Venice Italian Treebank, a Treebank of written...",
"This paper introduces an ongoing work on developing verb frames for Hindi. Verb frames capture syntactic commonalities of semantically related verbs. ...",
"We present in this paper a comparison between three segmentation systems for the Vietnamese language. Indeed, the majority of Vietnamese words is buil...",
"This paper presents two lexical data bases for Romanian: RoMorphoDict, a dictionary of inflected forms and RoSyllabiDict, a dictionary of syllabified ...",
"We report the construction of a corpus for parser evaluation in the biomedical domain. A 50-abstract subset (492 sentences) of the GENIA corpus (Kim e...",
"In this paper we present an active approach to annotate with lexical and semantic labels an Italian corpus of conversational human-human and Wizard-of...",
"We present the main outcomes of the COREA project: a corpus annotated with coreferential relations and a coreference resolution system for Dutch. In t...",
"We present the main findings and preliminary results of an ongoing project aimed at developing a system for collocation extraction based on contextual...",
"The measurement of conceptual similarity in a hierarchical structure has been proposed by studies such as Wu and Palmer (1994) which have been summari...",
"We present recent work in the area of Cross-Domain Dialogue Act (DA) tagging. We have previously reported on the use of a simple dialogue act classifi...",
"We are currently developing MiniSTEx, a spatiotemporal annotation system to handle temporal and/or geospatial information directly and indirectly expr...",
"This paper presents a methodology for the design and implementation of user-centred language checking applications. The methodology is based on the se...",
"Recent years have seen increasing attention in temporal processing of texts as well as a lot of standardization effort of temporal information in natu...",
"Nowadays portable devices such as smart phones can be used to capture the face of a user simultaneously with the voice input. Server based or even emb...",
"This paper reports on the QAST track of CLEF aiming to evaluate Question Answering on Speech Transcriptions. Accessing information in spoken documents...",
"In human translation, translators first make draft translations and then modify and edit them. In the case of experienced translators, this process in...",
"In this article, we present a method for extracting automatically semantic relations from texts in the medical domain using linguistic patterns. These...",
"It is a challenging task to match similar or related terms/expressions in NLP and Text Mining applications. Two typical areas in need for such work ar...",
"This paper discusses the problem of utilising multiply annotated data in training biomedical information extraction systems. Two corpora, annotated wi...",
"We argue for the necessity of studying human-human spoken conversations of various kinds in order to create user interfaces to databases. An efficient...",
"Although the World Wide Web has late become an important source to consult for the meaning of words, a number of technical terms related to high techn...",
"In this paper we will focus on the lexical-semantic relations in the German wordnet GermaNet. It has been shown that wordnets suffer from the relative...",
"The re-use of spoken word audio collections maintained by audiovisual archives is severely hindered by their generally limited access. The CHoral proj...",
"We present a new coding mechanism, spatiotemporal coding, that allows coders to annotate points and regions in the video frame by drawing directly on ...",
"In this paper we present an extension of the MATE/GNOME annotation scheme for anaphora (Poesio, 2004) which accounts for abstract anaphora in Danish a...",
"We report about a project which brings together Natural Language Processing and eLearning. One of the functionalities developed within this project is...",
"This paper explains our developing Corpus of Japanese classroom Lecture speech Contents (henceforth, denoted as CJLC). Increasing e-Learning contents ...",
"The EVALITA 2007 Parsing Task has been the first contest among parsing systems for Italian. It is the first attempt to compare the approaches and the ...",
"This paper presents a freely available evaluation tool for dependency parsing: MaltEval (http://w3.msi.vxu.se/users/jni/malteval). It is flexible and ...",
"In this paper we present JMWNL, a multilingual extension of the JWNL java library, which was originally developed for accessing Princeton WordNet dict...",
"Semantic annotation of text requires the dynamic merging of linguistically structured information and a &#147;world model&#148;, usually represented a...",
"Over the past five years, the Defense Advanced Research Projects Agency (DARPA) has funded development of speech translation systems for tactical appl...",
"Subcategorization is a kind of knowledge which can be considered as crucial in several NLP tasks, such as Information Extraction or parsing, but the c...",
"Word sketches are part of the Sketch Engine corpus query system. They represent automatic, corpus-derived summaries of the words&#146; grammatical and...",
"Automatic Term recognition (ATR) is a fundamental processing step preceding more complex tasks such as semantic search and ontology learning. From a l...",
"The rapid growth of the Internet means that more information is available than ever before. Multilingual multi-document summarisation offers a way to ...",
"Relation extraction is the task of finding pre-defined semantic relations between two entities or entity mentions from text. Many methods, such as fea...",
"Ontology construction usually requires a domain-specific corpus for building corresponding concept hierarchy. The domain corpus must have a good cover...",
"We report the results of our experiment on assessing the ability of automated MT evaluation metrics to remain sensitive to variations in MT quality as...",
"We report on the evaluation of information structural annotation according to the Linguistic Information Structure Annotation Guidelines (LISA, (Dippe...",
"This paper presents the process of acquiring a large, domain independent, taxonomy from the German Wikipedia. We build upon a previously implemented p...",
"Air traffic control (ATC) is based on voice communication between pilots and controllers and uses a highly task and domain specific language. Due to t...",
"Dating of contents is relevant to multiple advanced Natural Language Processing (NLP) applications, such as Information Retrieval or Question Answerin...",
"This paper reports on the design and construction of a bio-event annotated corpus which was developed with a specific view to the acquisition of seman...",
"This work presents improvements of a large-scale Arabic to French statistical machine translation system over a period of three years. The development...",
"In languages that use diacritical characters, if these special signs are stripped-off from a word, the resulted string of characters may not exist in ...",
"This paper describes part of the corpus collection efforts underway in the EC funded Companions project. The Companions project is collecting substant...",
"Entities - people, organizations, locations and the like - have long been a central focus of natural language processing technology development, since...",
"The release of the Enron corpus provided a unique resource for studying aspects of email use, because it is largely unfiltered, and therefore presents...",
"The paper describes the project whose main purpose is the creation of the Slovene terminology web portal, funded by the Slovene Research Agency and th...",
"The present contribution aims at increasing our understanding of automatic speech recognition (ASR) errors involving frequent homophone or almost homo...",
"Chemistry research papers are a primary source of information about chemistry, as in any scientific field. The presentation of the data is, predominan...",
"A speech and noise corpus dealing with the extreme conditions of the motorcycle environment is developed within the MoveOn project. Speech utterances ...",
"In this paper, we determine the relationships between nursing activities and nurseing conversations based on the principle of maximum entropy. For ana...",
"In this paper we discuss how linguistic and geographic distances can be related using a 3D visualization. We will convert linguistic data for location...",
"A new procedure is described for generating pronunciations for a dictionary of place-names in a less-resourced language (Welsh, spoken in Wales, UK). ...",
"This paper proposes a distributional model of word use and word meaning which is derived purely from a body of text, and then applies this model to de...",
"With the appearance of Semantic Web technologies, it becomes possible to develop novel, sophisticated question answering systems, where ontologies are...",
"While the Web is facing interesting new changes in the way users access, interact and even participate to its growth, the most traditional application...",
"In recent years, language resources acquired from theWeb are released, and these data improve the performance of applications in several NLP tasks. Al...",
"Each year NIST releases a set of question, document id, answer-triples for the factoid questions used in the TREC Question Answering track. While this...",
"In this paper we describe the result of manually annotating I-CAB, the Italian Content Annotation Bank, by expressions of private state (EPSs), i.e., ...",
"We describe an automatic projection algorithm for transferring frame-semantic information from English to Italian texts as a first sep towards the cre...",
"We provide an overview of corpus building efforts at the Jena University Language & Information Engineering (JULIE) Lab which are focused on life scie...",
"Data models and encoding formats for syntactically annotated text corpora need to deal with syntactic ambiguity; underspecified representations are pa...",
"It is known that POS tagging is not very accurate for unknown words (words which the POS tagger has not seen in the training corpora). Thus, a first s...",
"In this article, we propose a web based listening test system that can be used with a large range of listeners. Our main goals were to make the config...",
"The first release of the German Ph@ttSessionz speech database contains read and spontaneous speech from 864 adolescent speakers and is the largest dat...",
"This paper describes a method of automatic emotional degree labeling for speaker&#146;s anger utterances during natural Japanese dialog. First, we exp...",
"This paper describes the design, implementation and population of a lexical resource for biology and bioinformatics (the BioLexicon) developed within ...",
"The paper presents a comparative study of semantic and lexical relations defined and adopted in WordNet and EuroWordNet. This document describes the e...",
"This paper describes the building of a valency lexicon of Arabic verbs using a morphologically and syntactically annotated corpus, the Prague Arabic D...",
"Spoken corpora provide a critical resource for research, development and evaluation of spoken dialog systems. This paper describes the telephone spoke...",
"This paper presents recent results of the application of the task-based Browser Evaluation Test (BET) to meeting browsers, that is, interfaces to mult...",
"This paper describes SW1, the first version of a semantically annotated snapshot of the English Wikipedia. In recent years Wikipedia has become a valu...",
"In this paper we present a usability measure adapted to mobile services, which is based on the well-known theoretical framework defined in the ISO 924...",
"Recent years have seen an increasing interest in developing standards for linguistic annotation, with a focus on the interoperability of the resources...",
"This paper describes a multichannel acoustic data collection recorded under the European DICIT project, during the Wizard of Oz (WOZ) experiments carr...",
"In this paper we present results from using Random indexing for Latent Semantic Analysis to handle Singular Value Decomposition tractability issues. I...",
"We present an approach to creating a treebank of sentences using multiple notations or linguistic theories simultaneously. We illustrate the method by...",
"A core ontology is a mid-level ontology which bridges the gap between an upper ontology and a domain ontology. Automatic Chinese core ontology constru...",
"The ability to make progress in Computational Linguistics depends on the availability of large annotated corpora, but creating such corpora by hand an...",
"The ultimate goal when building dialogue systems is to satisfy the needs of real users, but quality assurance for dialogue strategies is a non-trivial...",
"Morfette is a modular, data-driven, probabilistic system which learns to perform joint morphological tagging and lemmatization from morphologically an...",
"Automated extraction of ontological knowledge from text corpora is a relevant task in Natural Language Processing. In this paper, we focus on the prob...",
"In order to improve the flexibility and the precision of an automatic phone segmentation system for a type of expressive speech, the dubbing into Fren...",
"This paper presents the application of inheritance to the formal taxonomy (is-a) of a semantically rich Language Resource based on the Generative Lexi...",
"In this paper we present the procedure we followed to develop the Italian Super Sense Tagger. In particular, we adapted the English SuperSense Tagger ...",
"Polarizing discussions about political and social issues are common in mass media. Annotations on the degree to which a sentence expresses an ideologi...",
"We present the results of an agreement task carried out in the framework of the KNOW Project and consisting in manually annotating an agreement sample...",
"Speech synthesis by unit selection requires the segmentation of a large single speaker high quality recording. Automatic speech recognition techniques...",
"This paper presents our findings on the feasibility of doing pronoun resolution for biomedical texts, in comparison with conducting pronoun resolution...",
"In this paper we present a Linguistic Meta-Model (LMM) allowing a semiotic-cognitive representation of knowledge. LMM is freely available and integrat...",
"After a long history of compilation of our own lexical resources, EDR Japanese/English Electronic Dictionary, and discussions with major players on de...",
"In this paper, we investigate quasi-abstractive summaries, a new type of machine-generated summaries that do not use whole sentences, but only fragmen...",
"This paper describes the creation of a bilingual corpus of inter-linked events for Italian and English. Linkage is accomplished through the Inter-Ling...",
"The majority of work described in this paper was conducted as part of the Recovering Evidence from Video by fusing Video Evidence Thesaurus and Video ...",
"The paper describes a method of word phonosemantics estimation. We treat phonosemantics as a subconscious emotional perception of word sounding indepe...",
"The PIT corpus is a German multi-media corpus of multi-party dialogues recorded in a Wizard-of-Oz environment at the University of Ulm. The scenario i...",
"This paper presents various strategies for improving the extraction performance of less prominent relations with the help of the rules learned for sim...",
"This paper analyses some general issues about human language technology evaluation, focusing on economic aspects. It first provides a scientific ratio...",
"To answer the critical need for sharable, reusable annotated resources with rich linguistic annotations, we are developing a Manually Annotated Sub-Co...",
"This paper proposes an extension of Sumida and Torisawa&#146;s method of acquiring hyponymy relations from hierachical layouts in Wikipedia (Sumida an...",
"In this paper, we report our work on the creation of a number of lexical resources that are crucial for an interlingua based MT from English to other ...",
"This paper deals with the relationship between weblog content and time. With the proposed temporal mutual information, we analyze the collocations in ...",
"Regulus is an Open Source platform that supports construction of rule-based medium-vocabulary spoken dialogue applications. It has already been used t...",
"This paper presents EASY, which has been the first campaign evaluating syntactic parsers on all the common syntactic phenomena and a large set of depe...",
"We present an approach for the cross-lingual induction of speech recognition grammars that separates the task of translation from the task of grammar ...",
"This paper reports on the main phases of a research which aims at enhancing a maritime terminological database by means of a set of terms belonging to...",
"An ontological knowledge management system requires dynamic and encapsulating operation in order to share knowledge among communities. The key to succ...",
"We discuss a named entity recognition system for Arabic, and show how we incorporated the information provided by MADA, a full morphological tagger wh...",
"This paper describes a solution to lexical transfer as a trade-off between a dictionary and an ontology. It shows its association to a translation too...",
"The work described in this paper aims to enrich the noun classifications of an existing database of lexical resources (de Matos and Ribeiro, 2004) add...",
"This paper presents the QALL-ME benchmark, a multilingual resource of annotated spoken requests in the tourism domain, freely available for research p...",
"Building a Linguistic Resource (LR) is a task requiring a huge quantitative of means, human resources and funds. Though finalization of the developmen...",
"Spectral clustering is a powerful clustering method for document data set. However, spectral clustering needs to solve an eigenvalue problem of the ma...",
"EVALITA 2007, the first edition of the initiative devoted to the evaluation of Natural Language Processing tools for Italian, provided a shared framew...",
"In this paper we discuss a rule-based approach to chunking sentences in Croatian, implemented using local regular grammars within the NooJ development...",
"This paper describes in detail the data that was collected and annotated during the third and final year of the CHIL project. This data was used for t...",
"Foreign name expressions written in Chinese characters are difficult to recognize since the sequence of characters represents the Chinese pronunciatio...",
"The present paper reports on a preparatory research for building a language corpus annotation scenario capturing the discourse relations in Czech. We ...",
"SECTra_w is a web-oriented system mainly dedicated to the evaluation of MT systems. After importing a source corpus, and possibly reference translatio...",
"In the present paper we report on the development of a cluster of web services of language technology for Portuguese that we named as LXService. These...",
"Recently the LATL has undertaken the development of a multilingual translation system based on a symbolic parsing technology and on a transfer-based t...",
"The development of natural language processing (NLP) components is resource-intensive and therefore justifies exploring ways of reducing development t...",
"The paper presents two experiments of unsupervised classification of Italian noun phrases. The goal of the experiments is to identify the most promine...",
"We present TextPro, a suite of modular Natural Language Processing (NLP) tools for analysis of Italian and English texts. The suite has been designed ...",
"We have analyzed system rankings for person name search algorithms using a data set for which several versions of ground truth were developed by emplo...",
"This paper describes the development of a written corpus of argumentative reasoning. Arguments in the corpus have been analysed using state of the art...",
"Accessing structured data in the form of ontologies requires training and learning formal query languages (e.g., SeRQL or SPARQL) which poses signific...",
"This paper describes a project aimed at converting a legacy representation of English idioms into an XML-based format. The project is set in the conte...",
"Being the client&#146;s first interface, call centres worldwide contain a huge amount of information of all kind under the form of conversational spee...",
"Lexical ontologies and semantic lexicons are important resources in natural language processing. They are used in various tasks and applications, espe...",
"In this paper we address the issue of developing an interoperable infrastructure for language resources and technologies. In our approach, called UFRA...",
"The lack of structure in the content of email messages makes it very hard for data channelled between the sender and the recipient to be correctly int...",
"The availability of large amounts of data is a fundamental prerequisite for building handwriting recognition systems. Any system needs a test set of l...",
"We present a topic boundary detection method that searches for connections between sequences of utterances in multi party dialogues. The connections a...",
"In this paper we present an overview on the development of a large vocabulary continuous speech recognition (LVCSR) system for Khmer, the official lan...",
"For compounding languages, a great part of the topical semantics is transported via nominal compounds. Various applications of natural language proces...",
"This paper presents a corpus study of parenthetical constructions in two different corpora: the Penn Discourse Treebank (PDTB, (PDTBGroup, 2008)) and ...",
"The present paper deals with the design and the annotation of a Greek real-world emotional speech corpus. The speech data consist of recordings collec...",
"We present work on a three-stage system to detect and classify disfluencies in multi party dialogues. The system consists of a regular expression base...",
"Part-of-speech or morphological tags are important means of annotation in a vast number of corpora. However, different sets of tags are used in differ...",
"The objective of the Semiotic-based Ontology Evaluation Tool (S-OntoEval) is to evaluate and propose improvements to a given ontological model. The ev...",
"The influence of English as a global language continues to grow to an extent that its words and expressions permeate the original forms of other langu...",
"This paper investigates a new evaluation method for assessing the coherence of computer-aided summaries, justified by the inappropriacy of existing ev...",
"The NIST Automatic Content Extraction (ACE) Evaluation expands its focus in 2008 to encompass the challenge of cross-document and cross-language globa...",
"This paper presents OMINE, an opinion mining system which aims to identify concepts such as products and their attributes, and analyze their correspon...",
"Recently, there has been an emphasis on creating shared resources for natural language processing applications. This has resulted in the development o...",
"In this paper we present how resources and tools developed within the Human Language Technology Group at the University of Belgrade can be used for tu...",
"This paper describes a study of the levels at which different rhetorical relations occur in rhetorical structure trees. In a previous empirical study ...",
"We propose a set of heuristics for improving annotation quality of very large corpora efficiently. The Xinhua News portion of the Chinese Gigaword Cor...",
"In this paper we describe an approach that both creates crosslingual acoustic monophone model sets for speech recognition tasks and objectively predic...",
"We evaluate the extent to which the distinction between semantically core and non-core dependents as used in the FrameNet corpus corresponds to the tr...",
"This paper presents an annotation scheme for marking subjective content in meetings, specifically the opinions and sentiments that participants expres...",
"We present an evaluation of inter-sentential coreference annotation in the context of manually created semantic networks. The semantic networks are co...",
"In this paper Semantic Press, a tool for the automatic press review, is introduced. It is based on Text Mining technologies and is tailored to meet th...",
"We describe the creation of a corpus that supports a real-world hierarchical text categorization task in the domain of electronic rulemaking (eRulemak...",
"This paper describes tools and techniques for accessing large quantities of speech data and for the visualisation of discourse interactions and events...",
"This paper introduces a method for creating a subjectivity lexicon for languages with scarce resources. The method is able to build a subjectivity lex...",
"In this paper, we describe an approach that aims to model heterogeneous resources for information extraction. Document is modeled in graph representat...",
"The Arabic Treebank (ATB), released by the Linguistic Data Consortium, contains multiple annotation files for each source file, due in part to the rol...",
"There are conflicting views in the literature as to the role of listener-adaptive processes in language production in general and articulatory reducti...",
"As many popular text genres such as blogs or news contain opinions by multiple sources and about multiple targets, finding the sources and targets of ...",
"This paper presents resources and strategies for persuasive natural language processing. After the introduction of a specifically tagged corpus, some ...",
"West African languages are written with alphabets that comprize non classical Latin characters. It is possible to design virtual keyboards which allow...",
"This paper reports on the annotation of all English verbs included in WordNet 2.0 with TimeML event classes. Two annotators assign each verb present i...",
"Evaluation campaigns have become an established way to evaluate automatic systems which tackle the same task. This paper presents the first edition of...",
"Semantic databases are a stable starting point in developing knowledge based systems. Since creating language resources demands many temporal, financi...",
"This paper describes methods used for generating a morphological lexicon of organization entity names in Croatian. This resource is intended for two p...",
"In this paper we present an approach to terminology recognition whereby a sublanguage term (e.g. an aircraft engine component term extracted from a ma...",
"Reported speech in the form of direct and indirect reported speech is an important indicator of evidentiality in traditional newspaper texts, but also...",
"In this paper a first implementation of a tool for valence shifting of natural language texts, named Valentino (VALENced Text INOculator), is presente...",
"In this paper we investigate the coverage of the two knowledge sources WordNet and Wikipedia for the task of bridging resolution. We report on an anno...",
"What&#146;s the best way to assess the performance of a semantic component in an NLP system? Tradition in NLP evaluation tells us that comparing outpu...",
"We discuss factors that affect human agreement on a semantic labeling task in the art history domain, based on the results of four experiments where w...",
"ProPOSEL is a prototype prosody and PoS (part-of-speech) English lexicon for Language Engineering, derived from the following language resources: the ...",
"Producing machine translation (MT) for the many minority languages in the world is a serious challenge. Minority languages typically have few resource...",
"We describe techniques for the automatic detection of relationships among domain entities (e.g. genes, proteins, diseases) mentioned in the biomedical...",
"The metadata management system for speech corpora &#147;memasysco&#148; has been developed at the Institut f&#252r Deutsche Sprache (IDS) and is applied f...",
"Existing techniques extract term candidates by looking for internal and contextual information associated with domain specific terms. The algorithms a...",
"In this paper we present and discuss the results of a text coherence experiment performed on a small corpus of Romanian text from a number of alternat...",
"In current phrase-based Statistical Machine Translation systems, more training data is generally better than less. However, a larger data set eventual...",
"In this paper, we present a linguistic resource that annotates event structures in texts. We consider an event structure as a collection of events tha...",
"In this paper, we describe NineOneOne (9-1-1), a system designed to recognize and translate Spanish emergency calls for better dispatching. We analyze...",
"This paper proposes a new method of the sentiment analysis utilizing inter-sentence structures especially for coping with reversal phenomenon of word ...",
"Patients require access to Electronic Patient Records, however medical language is often too difficult for patients to understand. Explaining records ...",
"This paper describes a syllabification based conversion method for converting romanized Persian text to the traditional Arabic-based writing system. T...",
"Motivated by the expense in time and other resources to produce hand-crafted grammars, there has been increased interest in automatically obtained wid...",
"In this paper we present contrastive colour studies done using COMPARA, the largest edited parallel corpus in the world (as far as we know). The studi...",
"We describe a new multimodal corpus currently under development. The corpus consists of videos of task-oriented dialogues that are annotated for speak...",
"In this paper we share our experience and describe the methodologies that we have used in designing and recording large speech databases for applicati...",
"This paper discusses the use of computational linguistic technology to extract definitions from a large corpus of German court decisions. We present a...",
"We aim to characterize the comparability of corpora, we address this issue in the trilingual context through the distinction of expert and non expert ...",
"In this paper we deal with a recently developed large Czech MWE database containing at the moment 160,000 MWEs (treated as lexical units). It was comp...",
"Systems that automatically process sign language rely on appropriate data. We therefore present the ATIS sign language corpus that is based on the dom...",
"The extraction of flat concepts out of a given word sequence is usually one of the first steps in building a spoken language understanding (SLU) or di...",
"This article is interested in the problem of the linguistic content of a speech corpus. Depending on the target task, the phonological and linguistic ...",
"Managing large groups of human judges to perform any annotation task is a challenge. Linguistic Data Consortium coordinated the creation of manual mac...",
"We present the second version of the Penn Discourse Treebank, PDTB-2.0, describing its lexically-grounded annotations of discourse relations and their...",
"The Linguistic Data Consortium (LDC) seeks to provide its members with quality linguistic resources and services. In order to pursue these ideals and ...",
"Terminologies and other knowledge resources are widely used to aid entity recognition in specialist domain texts. As well as providing lexicons of spe...",
"We present a new corpus for computational stylometry, more specifically authorship attribution and the prediction of author personality from text. Bec...",
"This paper presents a corpus-based study of the discourse connective &#147;in contrast&#148;. The corpus data are drawn from the British National Corp...",
"In this paper we describe some studies of Portuguese-English word alignment, focusing on (i) measuring the importance of the coupling between dictiona...",
"This paper describes a newly created text corpus of news articles that has been annotated for cross-document co-reference. Being able to robustly reso...",
"In this paper, we reported experiments of unsupervised automatic acquisition of Italian and English verb subcategorization frames (SCFs) from general ...",
"This paper presents the evaluation of the dictionary look-up component of Mayo Clinic&#146;s Information Extraction system. The component was tested o...",
"We present a knowledge-based coreference resolution system for noun phrases in Hungarian texts. The system is used as a module in an automated psychol...",
"Pattern matching, or querying, over annotations is a general purpose paradigm for inspecting, navigating, mining, and transforming annotation reposito...",
"This paper presents a method for compiling a large-scale bilingual corpus from a database of movie subtitles. To create the corpus, we propose an algo...",
"This poster presents an ISO framework for the standardization of syntactic annotation (SynAF). The normative part SynAF is concerned with a metamodel ...",
"This paper describes a collection of correlated communicative samples collected from the same individuals across six diverse genres. Three of the genr...",
"The goal of the DARPA MADCAT (Multilingual Automatic Document Classification Analysis and Translation) Program is to automatically convert foreign lan...",
"We describe methods for extracting interesting factual relations from scientific texts in computational linguistics and language technology taken from...",
"We evaluate discriminative parse reranking and parser self-training on a new English test set using four versions of the Charniak parser and a variety...",
"The Linguistic Data Consortium (LDC) creates a variety of linguistic resources - data, annotations, tools, standards and best practices - for many spo...",
"The number and sizes of parallel corpora keep growing, which makes it necessary to have automatic methods of processing them: combining, checking and ...",
"This paper describes experimental use of the multi-agent architecture to integrate Natural Language and Information Systems research and teaching, by ...",
"Parallel text is one of the most valuable resources for development of statistical machine translation systems and other NLP applications. The Linguis...",
"This paper presents three electronic collections of polarity items: (i) negative polarity items in Romanian, (ii) negative polarity items in German, a...",
"As huge quantities of documents have become available, services using natural language processing technologies trained by huge corpora have emerged, s...",
"One of the aims of the Language Technology for eLearning project is to show that Natural Language Processing techniques can be employed to enhance the...",
"Semantic similarity is a key issue in many computational tasks. This paper goes into the development and evaluation of two common ways of automaticall...",
"Evaluation of machine translation (MT) output is a challenging task. In most cases, there is no single correct translation. In the extreme case, two t...",
"The paper gives a comprehensive overview over the results, the concepts and the methods which were developed and used to create the Pronouncing Dictio...",
"The paper will give an overview of developments in Estonia in the field of Human Language Technologies. Despite of the fact that Estonian is one of th...",
"Looking for a better understanding of spontaneous speech-related phenomena and to improve automatic speech recognition (ASR), we present here a study ...",
"This paper describes a method of accurately projecting Propbank roles onto constituents in the CCGbank and automatically annotating verbal categories ...",
"This paper reports the principles behind designing a tagset to cover Russian morphosyntactic phenomena, modifications of the core tagset, and its eval...",
"In Japanese, the syntactic structure of a sentence is generally represented by the relationship between phrasal units, bunsetsus in Japanese, based on...",
"In this paper, we propose a new phrase-based translation model based on inter-lingual triggers. The originality of our method is double. First we iden...",
"Recent years have seen increased interest within the speaker recognition community in high-level features including, for example, lexical choice, idio...",
"In this work, we examine and attempt to extend the coverage of a German HPSG grammar. We use the grammar to parse a corpus of newspaper text and evalu...",
"The Italian particle &#147;ne&#148; exhibits interesting anaphoric properties that have not been yet explored in depth from a corpus and computational...",
"We report on the construction of a gold-standard dataset consisting of annotated clinical notes suitable for evaluating our biomedical named entity re...",
"Evaluating the output of NLG systems is notoriously difficult, and performing assessments of text quality even more so. A range of automated and subje...",
"We describe the induction of lexical resources from unannotated corpora that are aligned with treebank grammars, providing a systematic correspondence...",
"We implement several different methods for generating jokes in English. The common theme is to intentionally produce poor utterances by breaking Grice...",
"This paper presents a general methodology to mapping EuroWordNets (Vossen, 1998) to the Suggested Upper Merged Ontology (SUMO; Niles and Pease (2001))...",
"We report on an effort to build a corpus of Modern Hebrew tagged with part-of-speech and morphology. We designed a tagset specific to Hebrew while foc...",
"This paper discusses the design, recording and preprocessing of a Czech sign language corpus. The corpus is intended for training and testing of sign ...",
"This paper describes a Name Matching Evaluation Laboratory that is a joint effort across multiple projects. The lab houses our evaluation infrastructu...",
"The research project &#147;German Today&#148; aims to determine the amount of regional variation in (near-)standard German spoken by young and older e...",
"The Arabic Treebank team at the Linguistic Data Consortium has significantly revised and enhanced its annotation guidelines and procedure over the pas...",
"When dealing with large, distributed systems that use state-of-the-art components, individual components are usually developed in parallel. As develop...",
"Lexicon schemas and their use are discussed in this paper from the perspective of lexicographers and field linguists. A variety of lexicon schemas hav...",
"Fine-grained subjectivity analysis has been the subject of much recent research attention. As a result, the field has gained a number of working defin...",
"Although answering list questions is not a new research area, answering them automatically still remains a challenge. The median F-score of systems th...",
"Laughter is an intrinsic component of human-human interaction, and current automatic speech understanding paradigms stand to gain significantly from i...",
"In this paper, we present HeiNER, the multilingual Heidelberg Named Entity Resource. HeiNER contains 1,547,586 disambiguated English Named Entities to...",
"The paper describes the construction and usage of the Romanian version of the TimeBank corpus. The success rate of 96.53% for the automatic import of ...",
"Vector-based models of lexical semantics retrieve semantically related words automatically from large corpora by exploiting the property that words wi...",
"This paper discusses how Information Extraction is used to understand and manage Dialogue in the EU-funded Companions project. This will be discussed ...",
"Information extraction from large data repositories is critical to Information Management solutions. In addition to prerequisite corpus analysis, to d...",
"This paper discusses findings of a frame-based contrastive text analysis, using the large-scale and precise descriptions of semantic frames provided b...",
"Word Sense Disambiguation (WSD) is an intermediate task that serves as a means to an end defined by the application in which it is to be used. However...",
"Deep processing of natural language requires large scale lexical resources that have sufficient coverage at a sufficient level of detail and accuracy ...",
"The RITEL project aims to integrate a spoken language dialogue system and an open-domain information retrieval system in order to enable human users t...",
"This paper discusses a framework for development of bilingual and multilingual comprehension assistants and presents a prototype implementation of an ...",
"Low-density languages raise difficulties for standard approaches to natural language processing that depend on large online corpora. Using Persian as ...",
"Discourse structure and coherence relations are one of the main inferential challenges addressed by computational pragmatics. The present study focuse...",
"Roget&#146;s Thesaurus and WordNet are very widely used lexical reference works. We describe an automatic mapping procedure that effectively produces ...",
"Case frames are an important knowledge base for a variety of natural language processing (NLP) systems. For the practical use of these systems in the ...",
"Fixed, limited budgets often constrain the amount of expert annotation that can go into the construction of annotated corpora. Estimating the cost of ...",
"In this paper we describe the design and production of Catalan database for building synthetic voices. Two speakers, with 10 hours per speaker, have r...",
"The growing dependence of modern society on the Web as a vital source of information and communication has become inevitable. However, the Web has bec...",
"In this paper, we define the task of Number Identification in natural context. We present and validate a language-independent semi-automatic approach ...",
"Progress in the Machine Translation (MT) research community, particularly for statistical approaches, is intensely data-driven. Acquiring source langu...",
"To create the first Hungarian WSD corpus, 39 suitable word form samples were selected for the purpose of word sense disambiguation. Among others, sele...",
"Linguists have long been producing grammatical decriptions of yet undescribed languages. This is a time-consuming process, which has already adapted t...",
"The paper describes the project held within Russian National Corpus (http://www.ruscorpora.ru). Beside such obligatory constituents of a linguistic co...",
"People use the Internet to find a wide variety of images. Existing image search engines do not understand the pictures they return. The introduction o...",
"This paper describes a database of 11 dependency treebanks which were unified by means of a two-dimensional graph format. The format was evaluated wit...",
"In the present contribution we start with an overview of the linguistic situation of Luxembourg. We then describe specificities of spoken and written ...",
"The explicit introduction of morphosyntactic information into statistical machine translation approaches is receiving an important focus of attention....",
"For increased speed in developing gigaword language resources for medium resource density languages we integrated several FOSS tools in the HUN* toolk...",
"In this paper, quantitative analyses of the delay in Japanese-to-English (J-E) and English-to-Japanese (E-J) interpretations are described. The Simult...",
"This paper, the fifth in a series of biennial progress reports, reviews the activities of the Linguistic Data Consortium with particular emphasis on g...",
"In this work we propose a new strategy for the authorship identification problem and we test it on an example from Romanian literature: did Radu Albal...",
"Corpus based methods are increasingly used for speech technology applications and for the development of theoretical or computer models of spoken lang...",
"Metadata registries comprising sets of categories to be used in data collections exist in many fields. The purpose of a metadata registry is to facili...",
"Many applications of computational linguistics are greatly influenced by the quality of corpora available and as automatically generated corpora conti...",
"Many NLP modules and applications require the availability of a module for wide-coverage inflectional analysis. One way to obtain such analyses is to ...",
"In this paper we describe ANNALIST (Annotation, Alignment and Scoring Tool), a scoring system for the evaluation of the output of semantic annotation ...",
"In the field of Natural Language Processing, in order to work out a thematic representation system of general knowledge, methods relying on thesaurus ...",
"We describe ongoing work in semi-automatic annotating corpus, with the goal to answer why-question in question answering system and give a constructio...",
"This paper describes ODL, a description language for lexical information that is being developed within the context of a national project called MLRS ...",
"This paper summarizes the annotation of fine-grained entailment relationships in the context of student answers to science assessment questions. We an...",
"The output of a speech recognition system is not always ideal for subsequent downstream processing, in part because speakers themselves often make mis...",
"In many applications of natural language processing (NLP) grammatically tagged corpora are needed. Thus Part of Speech (POS) Tagging is of high import...",
"In the context of Natural Language Processing, annotation is about recovering implicit information that is useful for natural language applications. I...",
"This paper presents a supervised method for the detection and extraction of Causal Relations from open domain text. First we give a brief outline of t...",
"In this paper, we present the details of creating a pilot Arabic proposition bank (Propbank). Propbanks exist for both English and Chinese. However th...",
"Spock is an open source tool for the easy deployment of time-aligned corpora. It is fully web-based, and has very limited server-side requirements. It...",
"This paper addresses a novel approach that integrates two different types of information resources: the World Wide Web and libraries. This approach is...",
"A Hungarian multimodal spontaneous expressive speech corpus was recorded following the methodology of a similar French corpus. The method relied on a ...",
"Originally conceived as a &#147;na&#239ve&#148; baseline experiment using traditional n-gram language models as classifiers, the NCleaner system has turne...",
"We introduce a low-complexity method for acquiring fine-grained classes of named entities from the Web. The method exploits the large amounts of textu...",
"Voss et al. (2006) analyzed newswire translations of three DARPA GALE Arabic-English MT systems at the segment level in terms of subjective judgmen+F9...",
"In this paper we discuss an approach to the semi-automatic extraction and classification of the compounds extracted from German corpora. Compound nomi...",
"Traditional Authorship Attribution models extract normalized counts of lexical elements such as nouns, common words and punctuation and use these norm...",
"Developing resources which can be used for Natural Language Processing is an extremely difficult task for any language, but is even more so for less p...",
"We present new direct data analysis showing that dynamically-built context-dependent phrasal translation lexicons are more useful resources for phrase...",
"The project described in this paper is funded by the French Ministry of Research. It aims at providing producers of Language Resources, and HLT player...",
"This paper describes the latest developments in ELRA&#146;s services within the field of Language Resources (LR). These developments focus on 4 main g...",
"The JOSmorphosyntactic resources for Slovene consist of the specifications, lexicon, and two corpora: jos100k, a 100,000 word balanced monolingual sam...",
"In this paper we present an evaluation resource for geographic information retrieval developed within the Cross Language Evaluation Forum (CLEF). The ...",
"This paper describes the evaluation methodology used to evaluate the TC-STAR speech-to-speech translation (SST) system and the results from the third ...",
"This paper presents the results of the NEOLOGOS project: a children database and an optimized adult database for the French language. A new approach w...",
"The original Mixer corpus was designed to satisfy developing commercial and forensic needs. The resulting Mixer corpora, Phases 1 through 5, have evol...",
"Notwithstanding its acknowledged richness, the SIMPLE semantic model does not offer the representational vocabulary for encoding some conceptual links...",
"This paper introduces a new architecture that aims at combining molecular biology data with information automatically extracted from relevant scientif...",
"The InFile project (INformation, FILtering, Evaluation) is a cross-language adaptive filtering evaluation campaign, sponsored by the French National R...",
"In this paper we present the PASSAGE project which aims at building automatically a French Treebank of large size by combining the output of several p...",
"This paper presents an approach to annotation that BAE Systems has employed in the DARPA GALE Phase 2 Distillation evaluation. The purpose of the GALE...",
"Nowadays, there are hundreds of Natural Language Processing applications and resources for different languages that are developed and/or used, almost ...",
"The identification of class instances within unstructured text for either the purposes of Ontology population or semantic annotation are usually limit...",
"The present communication brings to the fore the work undertaken at the Royal Institute of the Amazigh Culture (IRCAM, henceforth) within the Language...",
"The importance of evaluation in promoting research and development in the information retrieval and natural language processing domains has long been ...",
"We describe a methodology for evaluating the statistical performance of information distillation systems and apply it to a simple illustrative example...",
"This paper describes the collect and transcription of a large set of Arabic broadcast news speech data. A total of more than 2000 hours of data was tr...",
"After the successful completion of the NEMLAR project 2003-2005, a new opportunity for a project was opened by the European Commission, and a group of...",
"This paper deals with a multilingual relational lexical database of proper name, Prolexbase, a free resource available on the CNRTL website. The Prole...",
"In this paper two highly innovative digital editions will be presented. For the creation and the implementation of these editions the latest developme...",
"In this paper we present a novel approach to the incremental incorporation of semantic information in natural language processing which does not fall ...",
"We present initial results from an international and multi-disciplinary research collaboration that aims at the construction of a reference corpus of ...",
"This paper presents the results of a joint effort of a group of multimodality researchers and tool developers to improve the interoperability between ...",
"Catchwords refer to popular words or phrases within certain area in certain period of time. In this paper, we propose a novel approach for automatic C...",
"Our goal is to provide a web-based platform for the long-term preservation and distribution of a heterogeneous collection of linguistic resources. We ...",
"One of the most challenging tasks for uniformed service personnel serving in foreign countries is effective verbal communication with the local popula..."];
// Common English function words, all lowercase.
// NOTE(review): presumably these are dropped from queries before the index
// lookup; the consumer is not visible in this file, so confirm against the
// search script.
// `var` is kept deliberately: in a classic script it makes the name a
// script-level global, which `let`/`const` would not expose the same way.
var stop_word_list = [
  "the", "and", "at", "in", "on", "with", "an", "of",
  "but", "here", "there", "that", "which", "from", "to", "too",
  "also", "when", "what", "who", "where", "are", "is", "will"
];

// Index terms listed in ascending lexicographic order.
// NOTE(review): these look like the boundary terms that split the index into
// separate sub-index files (see `index_prefix`), but that relationship is not
// shown here; verify against the index generator before editing by hand.
var jss_index = [
  "aaa", "additionalterm", "aise", "ambulance", "andrepositorie",
  "aparticular", "arrestedv", "attributioni", "barrera", "berry",
  "bonino", "byimplement", "ccm", "ciencia", "combinations",
  "connected", "correctif", "custormer", "deleted", "dialoguetype",
  "ditch", "dynamicsand", "elvas", "erfinden", "excel",
  "faux", "ffs", "fls", "francevincent", "gearon",
  "goodidea", "hamming", "hhhat", "hurtado", "illumination",
  "infomap", "interope", "istent", "jjffipi", "khosrow",
  "lafferty", "lernen", "ljubljana", "makarec", "mbt",
  "miguel", "moreminority", "nakaiwa", "niblack", "novel",
  "ofcluster", "oneor", "orthographically", "paralleel", "peris",
  "pnq", "prehensive", "proprietary", "rabeeen", "reduplication",
  "resampl", "robust", "sanchis", "segmentand", "sheffielddepartment",
  "sleepy", "specificity", "steininger", "succeededin", "systemoutput",
  "templates", "thece", "thequechua", "thrown", "tor",
  "trump", "unatainable", "usedto", "verifica", "warsaw",
  "whiskers", "wouldmake", "zhuli"
];
