@inproceedings{e495a598db534a1ab72db77c4c364191,
title = "Identifying queries in the wild, wild Web",
abstract = "Identifying user querying behavior is an important problem for information seeking and retrieval research. Query-related studies typically rely on server-side logs taken from a single search engine, but a comprehensive view of user querying behaviors requires analysis of data collected from the client-side for unrestricted searches. We developed three methods to identify querying behaviors and tested them on client-side logs collected in a lab experiment for realistic tasks and unrestricted searches on the entire Web. Results show that the best method was able to identify 97% of queries issued, with a precision of 92%. Although based on a relatively small number of search episodes, our methods, perhaps with minimal modifications, should be adequate for identification of queries in logs of unconstrained Web search.",
keywords = "Query identification, Query log analysis, Unrestricted search, User studies, Web search logs",
author = "Jingjing Liu and Chang Liu and Jun Zhang and Ralf Bierig and Michael Cole",
year = "2010",
doi = "10.1145/1840784.1840832",
language = "English (US)",
isbn = "9781450302470",
series = "IIiX 2010 - Proceedings of the 2010 Information Interaction in Context Symposium",
pages = "317--320",
booktitle = "IIiX 2010 - Proceedings of the 2010 Information Interaction in Context Symposium",
note = "3rd Information Interaction in Context Symposium, IIiX'10 ; Conference date: 18-08-2010 Through 21-08-2010",
}