{"id":"https://openalex.org/W4200410546","doi":"https://doi.org/10.3233/faia210326","title":"An Information Retrieval Pipeline for Legislative Documents from the Brazilian Chamber of Deputies","display_name":"An Information Retrieval Pipeline for Legislative Documents from the Brazilian Chamber of Deputies","publication_year":2021,"publication_date":"2021-12-02","ids":{"openalex":"https://openalex.org/W4200410546","doi":"https://doi.org/10.3233/faia210326"},"language":"en","primary_location":{"id":"doi:10.3233/faia210326","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia210326","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA210326","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA210326","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033149946","display_name":"Ellen Souza","orcid":"https://orcid.org/0000-0002-7706-4809"},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]},{"id":"https://openalex.org/I62921916","display_name":"Universidade Federal Rural de Pernambuco","ror":"https://ror.org/02ksmb993","country_code":"BR","type":"education","lineage":["https://openalex.org/I62921916"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Ellen Souza","raw_affiliation_strings":["Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","MiningBR Research Group, Federal Rural University of Pernambuco, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]},{"raw_affiliation_string":"MiningBR Research Group, Federal Rural University of Pernambuco, Brazil","institution_ids":["https://openalex.org/I62921916"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018359147","display_name":"Douglas Vit\u00f3rio","orcid":"https://orcid.org/0000-0003-2285-574X"},"institutions":[{"id":"https://openalex.org/I62921916","display_name":"Universidade Federal Rural de Pernambuco","ror":"https://ror.org/02ksmb993","country_code":"BR","type":"education","lineage":["https://openalex.org/I62921916"]},{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Douglas Vit\u00f3rio","raw_affiliation_strings":["Centro de Inform\u00e1tica, Federal University of Pernambuco, Brazil","MiningBR Research Group, Federal Rural University of Pernambuco, Brazil"],"affiliations":[{"raw_affiliation_string":"Centro de Inform\u00e1tica, Federal University of Pernambuco, Brazil","institution_ids":["https://openalex.org/I25112270"]},{"raw_affiliation_string":"MiningBR Research Group, Federal Rural University of Pernambuco, Brazil","institution_ids":["https://openalex.org/I62921916"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045908729","display_name":"Gyovana Moriyama","orcid":null},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Gyovana Moriyama","raw_affiliation_strings":["Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108498528","display_name":"Luiz Carlos Santos","orcid":null},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Luiz Santos","raw_affiliation_strings":["Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075485252","display_name":"Lucas Martins","orcid":"https://orcid.org/0000-0001-8730-4901"},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Lucas Martins","raw_affiliation_strings":["Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016818881","display_name":"Mariana Barbosa de Souza","orcid":"https://orcid.org/0000-0003-0126-6284"},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Mariana Souza","raw_affiliation_strings":["Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078938696","display_name":"M\u00e1rcio Alves da Fonseca","orcid":"https://orcid.org/0000-0002-9361-6108"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"M\u00e1rcio Fonseca","raw_affiliation_strings":["Chamber of Deputies, Brasilia, Brazil"],"affiliations":[{"raw_affiliation_string":"Chamber of Deputies, Brasilia, Brazil","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067624407","display_name":"N\u00e1dia F\u00e9lix","orcid":null},"institutions":[{"id":"https://openalex.org/I68106152","display_name":"Universidade Federal de Goi\u00e1s","ror":"https://ror.org/0039d5757","country_code":"BR","type":"education","lineage":["https://openalex.org/I68106152"]},{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"N\u00e1dia F\u00e9lix","raw_affiliation_strings":["Institute of Informatics, Federal University of Goi\u00e1s, Brazil","Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Informatics, Federal University of Goi\u00e1s, Brazil","institution_ids":["https://openalex.org/I68106152"]},{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079499583","display_name":"Andr\u00e9 C. P. L. F. de Carvalho","orcid":"https://orcid.org/0000-0002-4765-6459"},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Andr\u00e9 C.P.L.F. Carvalho","raw_affiliation_strings":["Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Computer Sciences, University of S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012164834","display_name":"Hidelberg Oliveira Albuquerque","orcid":"https://orcid.org/0000-0003-2277-8860"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]},{"id":"https://openalex.org/I62921916","display_name":"Universidade Federal Rural de Pernambuco","ror":"https://ror.org/02ksmb993","country_code":"BR","type":"education","lineage":["https://openalex.org/I62921916"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Hidelberg O. Albuquerque","raw_affiliation_strings":["Centro de Inform\u00e1tica, Federal University of Pernambuco, Brazil","MiningBR Research Group, Federal Rural University of Pernambuco, Brazil"],"affiliations":[{"raw_affiliation_string":"Centro de Inform\u00e1tica, Federal University of Pernambuco, Brazil","institution_ids":["https://openalex.org/I25112270"]},{"raw_affiliation_string":"MiningBR Research Group, Federal Rural University of Pernambuco, Brazil","institution_ids":["https://openalex.org/I62921916"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101774965","display_name":"Adriano Oliveira","orcid":"https://orcid.org/0000-0002-7451-7366"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Adriano L.I. Oliveira","raw_affiliation_strings":["Centro de Inform\u00e1tica, Federal University of Pernambuco, Brazil"],"affiliations":[{"raw_affiliation_string":"Centro de Inform\u00e1tica, Federal University of Pernambuco, Brazil","institution_ids":["https://openalex.org/I25112270"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5033149946"],"corresponding_institution_ids":["https://openalex.org/I17974374","https://openalex.org/I62921916"],"apc_list":null,"apc_paid":null,"fwci":28.9855,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.99418429,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13643","display_name":"Artificial Intelligence in Law","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9580000042915344,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bigram","display_name":"Bigram","score":0.817476749420166},{"id":"https://openalex.org/keywords/punctuation","display_name":"Punctuation","score":0.7594082355499268},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7099974155426025},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7099528312683105},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6679787635803223},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.6328586935997009},{"id":"https://openalex.org/keywords/chamber-of-deputies","display_name":"Chamber of Deputies","score":0.5502229332923889},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5256439447402954},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5233915448188782},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.45778030157089233},{"id":"https://openalex.org/keywords/legislature","display_name":"Legislature","score":0.4311577379703522},{"id":"https://openalex.org/keywords/newspaper","display_name":"Newspaper","score":0.42671093344688416},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.18810918927192688},{"id":"https://openalex.org/keywords/advertising","display_name":"Advertising","score":0.10480833053588867},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.1003713607788086},{"id":"https://openalex.org/keywords/trigram","display_name":"Trigram","score":0.0834762454032898}],"concepts":[{"id":"https://openalex.org/C108757681","wikidata":"https://www.wikidata.org/wiki/Q2773912","display_name":"Bigram","level":3,"score":0.817476749420166},{"id":"https://openalex.org/C540372491","wikidata":"https://www.wikidata.org/wiki/Q82622","display_name":"Punctuation","level":2,"score":0.7594082355499268},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7099974155426025},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7099528312683105},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6679787635803223},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.6328586935997009},{"id":"https://openalex.org/C2778964614","wikidata":"https://www.wikidata.org/wiki/Q320289","display_name":"Chamber of Deputies","level":3,"score":0.5502229332923889},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5256439447402954},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5233915448188782},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.45778030157089233},{"id":"https://openalex.org/C83009810","wikidata":"https://www.wikidata.org/wiki/Q11204","display_name":"Legislature","level":2,"score":0.4311577379703522},{"id":"https://openalex.org/C201280247","wikidata":"https://www.wikidata.org/wiki/Q11032","display_name":"Newspaper","level":2,"score":0.42671093344688416},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.18810918927192688},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.10480833053588867},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.1003713607788086},{"id":"https://openalex.org/C137546455","wikidata":"https://www.wikidata.org/wiki/Q3213474","display_name":"Trigram","level":2,"score":0.0834762454032898},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia210326","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia210326","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA210326","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia210326","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia210326","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA210326","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.800000011920929}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4200410546.pdf","grobid_xml":"https://content.openalex.org/works/W4200410546.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W80463681","https://openalex.org/W206042179","https://openalex.org/W207334483","https://openalex.org/W1511963917","https://openalex.org/W1594622829","https://openalex.org/W2038114184","https://openalex.org/W2085030399","https://openalex.org/W2087696423","https://openalex.org/W2097726431","https://openalex.org/W2112006025","https://openalex.org/W2121605237","https://openalex.org/W2215376118","https://openalex.org/W2228706226","https://openalex.org/W2306706380","https://openalex.org/W2338029868","https://openalex.org/W2573924519","https://openalex.org/W2618019017","https://openalex.org/W2624072012","https://openalex.org/W2792503084","https://openalex.org/W2990241252","https://openalex.org/W3015713034","https://openalex.org/W3081796136","https://openalex.org/W3106739167","https://openalex.org/W3154444249","https://openalex.org/W4205616574","https://openalex.org/W4235077579","https://openalex.org/W4251560691","https://openalex.org/W4252076394","https://openalex.org/W4288017055"],"related_works":["https://openalex.org/W3173084154","https://openalex.org/W2982021180","https://openalex.org/W2251497876","https://openalex.org/W2241081188","https://openalex.org/W2128567707","https://openalex.org/W159278796","https://openalex.org/W4327499987","https://openalex.org/W2011383762","https://openalex.org/W2035962958","https://openalex.org/W4313164761"],"abstract_inverted_index":{"This":[0],"work":[1],"investigates":[2],"information":[3],"retrieval":[4],"methods":[5],"to":[6,47,57,111,113,118,123],"address":[7],"the":[8,12,17,22,51,81,91,120],"existing":[9],"difficulties":[10],"on":[11],"Preliminary":[13],"Search,":[14],"part":[15],"of":[16,25,99],"law":[18],"making":[19],"process":[20],"from":[21,43,86],"Brazilian":[23],"Chamber":[24,44],"Deputies.":[26],"For":[27],"such,":[28],"different":[29],"preprocessing":[30],"approaches,":[31],"stemmers,":[32],"language":[33,78],"models,":[34],"and":[35,49,59,63,76],"BM25":[36],"variants":[37],"were":[38,45,55,67],"compared.":[39],"Two":[40],"legislative":[41],"corpora":[42],"used":[46],"build":[48],"validate":[50],"pipeline.":[52],"All":[53],"texts":[54],"converted":[56],"lowercase":[58],"had":[60],"stopwords,":[61],"accentuation,":[62],"punctuation":[64],"removed.":[65],"Words":[66],"represented":[68],"by":[69],"their":[70],"stem":[71],"combined":[72],"with":[73,93,104],"word":[74],"unigram":[75],"bigram":[77],"models.":[79],"Retrieving":[80],"bill":[82],"that":[83],"was":[84],"originated":[85],"a":[87,97],"specific":[88],"job":[89,115],"request,":[90],"BM25L":[92],"Savoy":[94],"stemmer":[95],"reached":[96],"R@20":[98,121],"0.7356.":[100],"After":[101],"removing":[102],"queries":[103],"inconsistencies":[105],"or":[106,117],"which":[107],"made":[108],"reference":[109],"exclusively":[110],"attachments,":[112],"other":[114],"requests,":[116],"bills,":[119],"increased":[122],"0.94.":[124]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
