% CLEF 2009 Intellectual Property track paper, published in the Springer LNCS
% post-workshop proceedings. Names are stored in "Last, First" form with
% LaTeX-escaped accents so the entry sorts and renders correctly under both
% classic BibTeX and biblatex/Biber. The citation key is the exporter's
% original identifier and is kept unchanged so existing \cite commands resolve.
@inproceedings{1574bd39e53541e2910f0de0ac378c67,
  author    = {Herbert, Benjamin and Szarvas, Gy{\"o}rgy and Gurevych, Iryna},
  title     = {Prior Art Search Using {International Patent Classification} Codes and All-Claims-Queries},
  editor    = {Peters, Carol and Di Nunzio, Giorgio Maria and Kurimo, Mikko and Mandl, Thomas and Mostefa, Djamel and Pe{\~n}as, Anselmo and Roda, Giovanna},
  booktitle = {Multilingual Information Access Evaluation {I}: Text Retrieval Experiments},
  series    = {Lecture Notes in Computer Science},
  volume    = {6241},
  pages     = {452--459},
  publisher = {Springer},
  address   = {Berlin, Heidelberg},
  year      = {2010},
  isbn      = {9783642157530},
  language  = {English},
  note      = {10th Workshop of the Cross-Language Evaluation Forum; conference date: 30 September--2 October 2009},
  abstract  = {In this paper, we describe the system we developed for the Intellectual Property track of the 2009 Cross-Language Evaluation Forum. The track addressed prior art search for patent applications. We used the Lucene library to conduct experiments with the traditional TF-IDF-based ranking approach, indexing both the textual content and the IPC codes assigned to each document. We formulated our queries by using the title and claims of a patent application in order to measure the (weighted) lexical overlap between topics and prior art candidates. We also formulated a language-independent query using the IPC codes of a document to improve the coverage and to obtain a more accurate ranking of candidates. Using a simple model, our system remained efficient and had a reasonably good performance score: it achieved the 6th best Mean Average Precision score out of 14 participating systems on 500 topics, and the 4th best score out of 9 participants on 10,000 topics.},
}