%%% -*-BibTeX-*- %%% ==================================================================== %%% BibTeX-file{ %%% author = "Nelson H. F. Beebe", %%% version = "1.94", %%% date = "31 January 2026", %%% time = "08:33:31 MDT", %%% filename = "tois.bib", %%% address = "University of Utah %%% Department of Mathematics, 110 LCB %%% 155 S 1400 E RM 233 %%% Salt Lake City, UT 84112-0090 %%% USA", %%% telephone = "+1 801 581 5254", %%% URL = "https://www.math.utah.edu/~beebe", %%% checksum = "29116 50062 253425 2430300", %%% email = "beebe at math.utah.edu, beebe at acm.org, %%% beebe at computer.org (Internet)", %%% codetable = "ISO/ASCII", %%% keywords = "bibliography, BibTeX, ACM Transactions on %%% Information Systems", %%% license = "public domain", %%% supported = "no", %%% docstring = "This is a COMPLETE BibTeX bibliography for %%% the journal ACM Transactions on Information %%% Systems (CODEN ATISET, ISSN 1046-8188), for %%% 1989--date. %%% %%% Publication began with volume 7, number 1, %%% in January 1989. The journal appears %%% quarterly, in January, April, July, and %%% October. Its predecessor, ACM Transactions %%% on Office Information Systems (CODEN %%% ATOSDO, ISSN 0734-2047), is covered in a %%% companion bibliography, toois.bib. %%% %%% The two journals have a joint World-Wide %%% Web site at: %%% %%% http://www.acm.org/pubs/tois %%% %%% Tables-of-contents of all issues are %%% available at: %%% %%% http://www.acm.org/pubs/contents/journals/tois/ %%% http://portal.acm.org/browse_dl.cfm?idx=J779 %%% %%% Qualified subscribers can retrieve the full %%% text of recent articles in PDF form. %%% %%% At version 1.94, the COMPLETE journal %%% coverage looked like this: %%% %%% 1989 ( 19) 2002 ( 16) 2015 ( 27) %%% 1990 ( 15) 2003 ( 16) 2016 ( 34) %%% 1991 ( 18) 2004 ( 20) 2017 ( 50) %%% 1992 ( 18) 2005 ( 16) 2018 ( 23) %%% 1993 ( 20) 2006 ( 19) 2019 ( 49) %%% 1994 ( 21) 2007 ( 25) 2020 ( 42) %%% 1995 ( 19) 2008 ( 27) 2021 ( 55) %%% 1996 ( 17) 2009 ( 18) 2022 ( 88) %%% 1997 ( 15) 2010 ( 28) 2023 ( 116) %%% 1998 ( 15) 2011 ( 16) 2024 ( 165) %%% 1999 ( 16) 2012 ( 27) 2025 ( 168) %%% 2000 ( 11) 2013 ( 22) 2026 ( 29) %%% 2001 ( 14) 2014 ( 21) %%% %%% Article: 1334 %%% Proceedings: 1 %%% %%% Total entries: 1335 %%% %%% The initial draft of this bibliography was %%% derived from data at the ACM Web site. It %%% was then augmented with data from the %%% Compendex and OCLC Contents1st databases, %%% and from the huge Karlsruhe computer %%% science bibliography archive. There were a %%% surprisingly large number of discrepancies %%% (in more than a third of the entries) in %%% these sources, but they have been resolved %%% by consulting the original journal issues. %%% %%% ACM copyrights explicitly permit abstracting %%% with credit, so article abstracts, keywords, %%% and subject classifications have been %%% included in this bibliography wherever %%% available. %%% %%% The bibsource keys in the bibliography %%% entries below indicate the data sources. %%% %%% URL keys in the bibliography point to %%% World Wide Web locations of additional %%% information about the entry. %%% %%% Spelling has been verified with the UNIX %%% spell and GNU ispell programs using the %%% exception dictionary stored in the %%% companion file with extension .sok. %%% %%% BibTeX citation tags are uniformly chosen %%% as name:year:abbrev, where name is the %%% family name of the first author or editor, %%% year is a 4-digit number, and abbrev is a %%% 3-letter condensation of important title %%% words. Citation tags were automatically %%% generated by software developed for the %%% BibNet Project. %%% %%% In this bibliography, entries are sorted in %%% publication order, using ``bibsort -byvolume.'' %%% %%% The checksum field above contains a CRC-16 %%% checksum as the first value, followed by the %%% equivalent of the standard UNIX wc (word %%% count) utility output of lines, words, and %%% characters. This is produced by Robert %%% Solovay's checksum utility.", %%% } %%% ==================================================================== @Preamble{ "\input bibnames.sty" # "\hyphenation{Chem-u-du-gun-ta Kou-ba-ra-kis San-kar-a-na-ray-a-nan Yan-kel-o-vich}" } %%% ==================================================================== %%% Acknowledgement abbreviations: @String{ack-nhfb = "Nelson H. F. Beebe, University of Utah, Department of Mathematics, 110 LCB, 155 S 1400 E RM 233, Salt Lake City, UT 84112-0090, USA, Tel: +1 801 581 5254, e-mail: \path|beebe@math.utah.edu|, \path|beebe@acm.org|, \path|beebe@computer.org| (Internet), URL: \path|https://www.math.utah.edu/~beebe/|"} %%% ==================================================================== %%% Journal abbreviations: @String{j-TOIS = "ACM Transactions on Information Systems"} %%% ==================================================================== %%% Publisher abbreviations: @String{pub-ACM = "ACM Press"} @String{pub-ACM:adr = "New York, NY 10036, USA"} %%% ==================================================================== %%% Bibliography entries: @Article{Allen:1989:ENN, author = "R. B. Allen", title = "Editorial: a New Name --- {ACM Transactions on Information Systems}", journal = j-TOIS, volume = "7", number = "1", pages = "1--2", month = jan, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "With this issue the Transactions becomes the ACM Transaction on Information Systems (TOIS). In addition, TOIS' charter has been expanded to formally include the field of Information Retrieval. These changes affirm the broad scope that the journal has been pursuing in recent years. As before, a wide variety of perspectives on information systems will be considered, including topics such as user and organizational interfaces, data models, system organization, knowledge bases, and new media. Of course, TOIS will also continue to examine the uses and impact of information systems. Thus, papers in areas such as electronic publishing, interactive video services, large text archives, UIMSs, intelligent tutoring systems, and cooperative work are encouraged. TOIS is primarily a research journal with an emphasis on quality and originality, as well as relevance. Moreover, TOIS has a Practice and Experience Section for papers that present novel insights without the usual rigor of Research Contributions. Together, the Associate Editors and I are committed to keeping TOIS the premier publication in its field. We will also strive to make TOIS a testbed for new information systems.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Stotts:1989:PNB, author = "P. David Stotts and Richard Furuta", title = "{Petri} Net Based Hypertext: Document Structure with Browsing Semantics", journal = j-TOIS, volume = "7", number = "1", pages = "3--29", month = jan, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We present a formal definition of the Trellis model of hypertext and describe an authoring and browsing prototype called $\alpha$ Trellis that is based on the model. The Trellis model not only represents the relationships that tie individual pieces of information together into a document (i.e., the adjacencies), but specifies the browsing semantics to be associated with the hypertext as well (i.e., the manner in which the information is to be visited and presented). The model is based on Petri nets, and is a generalization of existing directed graph-based forms of hypertext. The Petri net basis permits more powerful specification of what is to be displayed when a hypertext is browsed and permits application of previously developed Petri net analysis techniques to verify properties of the hypertext. A number of useful hypertext constructs, easily described in the Trellis model, are presented. These include the synchronization of simultaneous traversals of separate paths through a hypertext, the incorporation of access controls into a hypertext (i.e., specifying nodes that can be proven to be accessible only to certain classes of browsers), and construction of multiple specialized (tailored) versions from a single hypertext.", acknowledgement = ack-nhfb, affiliation = "Univ of Maryland", affiliationaddress = "College Park, MD, USA", classification = "723; 903", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Access controls; Browsing semantics; Browsing Semantics; Computation by abstract devices; Database Systems; Design; Formal models; Hypertext; Inf. storage and retrieval; Information Retrieval; Information Science; Languages; Miscellaneous; Models of computation; Petri nets; Petri Nets; Synchronization; Systems and software; Text processing; Theory; Trellis Model; Trellis model of hypertext", } @Article{Egan:1989:FDE, author = "Dennis E. Egan and Joel R. Remde and Louis M. Gomez and Thomas K. Landauer and Jennifer Eberhardt and Carol C. Lochbaum", title = "Formative Design-Evaluation of {SuperBook}", journal = j-TOIS, volume = "7", number = "1", pages = "30--57", month = jan, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "SuperBook is a hypertext browsing system designed to improve the usability of conventional documents. This work is a case study of formative design-evaluation. Behavioral evaluation of the first version of SuperBook showed how design factors and user strategies affected search and established baseline performance measures with printed text. The second version of SuperBook was implemented with the goal of improving search accuracy and speed. User strategies that had proved effective in the first study were made very easy and attractive to use. System response time for common operations was greatly improved. Behavioral evaluation of the new SuperBook demonstrated its superiority to printed text and suggested additional improvements that were incorporated into `MiteyBook,' a SuperBook implementation for PC-size screens. Search with MiteyBook proved to be approximately 25 percent faster and 25 percent more accurate than that obtained with a conventional printed book.", acknowledgement = ack-nhfb, affiliation = "Bellcore", affiliationaddress = "Morristown, NJ, USA", classification = "723; 903", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Database Systems; Documentation; Evaluation; Human factors; Hypertext; Inf. storage and retrieval; Information Retrieval; Information Retrieval Systems; Information Science; Information search; Information systems applications; Models and principles; Office automation; SuperBook; Systems and software; User/machine systems", wwwauthor = "D. E. Egan and J. R. Remde and J. M. Gomez and T. K. Landauer and J. Eberhardt and C. C. Lochbaum", } @Article{Utting:1989:COH, author = "Kenneth Utting and Nicole Yankelovich", title = "Context and Orientation in Hypermedia Networks", journal = j-TOIS, volume = "7", number = "1", pages = "58--84", month = jan, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The core of hypermedia's power lies in the complex networks of links that can be created within and between documents. However, these networks frequently overwhelm the user and become a source of confusion. Within Intermedia, we have developed the Web View --- a tool for viewing and navigating such networks with a minimum of user confusion and disorientation. The key factors in the Web View's success are a display that combines a record of the user's path through the network with a map of the currently available links; a scope line that summarizes the number of documents and links in the network; and a set of commands that permit the user to open documents directly from the Web View.", acknowledgement = ack-nhfb, affiliation = "Brown Univ", affiliationaddress = "Providence, RI, USA", classification = "723; 903", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Database Systems; Human factors; Hypermedia Networks; Hypermedia systems; Hypertext systems; Inf. storage and retrieval; Information Retrieval; Information Science; Network browsers; Sys. and software; Web View", wwwauthor = "N. Yankelovich and K. Utting", } @Article{Tompa:1989:DMF, author = "Frank Wm. Tompa", title = "A Data Model for Flexible Hypertext Database Systems", journal = j-TOIS, volume = "7", number = "1", pages = "85--100", month = jan, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Hypertext and other page-oriented databases cannot be-schematized in the same manner as record-oriented databases. As a result, most hypertext database implicitly employ a data model based on a simple, unrestricted graph. This paper presents a hypergraph model for maintaining page-oriented database in such a way that some of the functionality traditionally provided by database schemes can be available to hypertext database. In particular, the model formalizes identification of commonality in the structure, set-at-a-time database access, and definition of user-specific views. An efficient implementation of the model is also discussed.", acknowledgement = ack-nhfb, affiliation = "Univ of Waterloo", affiliationaddress = "Waterloo, Ont, Can", classification = "723; 903", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data manipulation languages (DML); Data models; Data Models; Database management; Database Systems; Design; Directed Hypergraphs; Directed hypergraphs; Hypertext; Information Retrieval; Information Science; Information storage; Information storage and retrieval; Languages; Logical design; Text Management; Text management; Videotex databases", } @Article{Sciore:1989:OS, author = "Edward Sciore", title = "Object Specialization", journal = j-TOIS, volume = "7", number = "2", pages = "103--122", month = apr, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Specialization hierarchies typically are treated as type-level constructs and are used to define various inheritance mechanisms. In this paper we consider specialization at the level of objects. We show that doing so creates a more flexible and powerful notion of inheritance by allowing objects to define their own inheritance path. Object specialization can also be used to model certain forms of versioning, implement data abstraction, and provide a `classless' prototype-based language interface to the user.", acknowledgement = ack-nhfb, affiliation = "Boston Univ", affiliationaddress = "Boston, MA, USA", classification = "723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Computer Interfaces; Computer Programming Languages; Database management; Database Systems; Deduction and theorem proving; Delegation; Design; Inheritance; Language constructs; Language Constructs; Languages; Object Oriented Database; Object-oriented database; Programming languages; Specialization Hierarchies; Theory", wwwpages = "103--123", } @Article{Guting:1989:ASO, author = "Ralf Hartmut Guting and Roberto Zicari and David M. Choy", title = "An Algebra for Structured Office Documents", journal = j-TOIS, volume = "7", number = "2", pages = "123--157", month = apr, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We describe a data model for structured office information objects, which we generically call `documents,' and a practically useful algebraic language for the retrieval and manipulation of such objects. Documents are viewed as hierarchical structures; their layout (presentation) aspect is to be treated separately. The syntax and semantics of the language are defined precisely in terms of the formal model, an extended relational algebra. The proposed approach has several new features, some of which are particularly useful for the management of office information. The data model is based on nested sequences of tuples rather than nested relations. Therefore, sorting and sequence operations and the explicit handling of duplicates can be described by the model. Furthermore, this is the first model based on a many-sorted instead of a one-sorted algebra, which means that atomic data values as well as nested structures are objects of the algebra. As a consequence, arithmetic operations, aggregate functions, and so forth can be treated inside the model.", acknowledgement = ack-nhfb, affiliation = "Univ of Dortmund", affiliationaddress = "Dortmund, West Ger", classification = "723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data models; Data Models; Database applications; Database management; Database Systems; Extended relational algebra; Forms processing; Information systems applications; Languages; Logical design; Management; Many-sorted algebra; Miscellaneous; Nested relations; Office automation; Office Automation; Query languages; Query Languages; Relational; Relational Algebra; Structured document; Theory; Tuple sequences", } @Article{Lee:1989:PSF, author = "Dik Lun Lee and Chun-Wu Leng", title = "Partitioned Signature Files: Design Issues and Performance Evaluation", journal = j-TOIS, volume = "7", number = "2", pages = "158--180", month = apr, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "A signature file acts as a filtering mechanism to reduce the amount of text that needs to be searched for a query. Unfortunately, the signature file itself must be exhaustively searched, resulting in degraded performance for a large file size. We propose to use a deterministic algorithm to divide a signature file into partitions, each of which contains signatures with the same `key.' The signature keys in a partition can be extracted and represented as the partition's key. The search can then be confined to the subset of partitions whose keys match the query key. Our main concern here is to study methods for obtaining the keys and their performance in terms of their ability to reduce the search space. We outline the criteria for evaluating partitioning schemes. Three algorithms are described and studied. An analytical study of the performance of the algorithms is provided, and the results are verified with simulation.", acknowledgement = ack-nhfb, affiliation = "Ohio State Univ", affiliationaddress = "Columbus, OH, USA", classification = "723; 903", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Access method; Access methods; Codes; Computer Programming--Algorithms; Computer Simulation; Data Processing--File Organization; Database management; Database Systems; Design; Document retrieval; Inf. storage and retrieval; Information retrieval; Information Retrieval; Information Science; Information systems applications; Library automation; Office automation; Parallel search; Parallel Search; Partitioned Signature Files; Performance; Performance evaluation; Physical design; Superimposed coding; Superimposed Coding; Surrogate file; Symbolic; Text editing; Text processing; Text retrieval", wwwtitle = "Partitioned Signature File: Design Issues and Performance Evaluation", } @Article{Croft:1989:EIS, author = "W. B. Croft", title = "Editorial: Introduction to the Special Issue", journal = j-TOIS, volume = "7", number = "3", pages = "181--182", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "This Special Issue contains selected papers from the SIGIR Conference on Research and Development in Information Retrieval held at Cambridge, Massachusetts in June, 1989. The papers were selected by the program committee and revised for publication in TOIS. Information retrieval is a diverse field of research, and the areas covered at this conference include formal models, search strategies, hypermedia, storage structures, evaluation, natural language processing, interfaces, and knowledge-based architectures. The unifying goal of this research is the efficient and effective retrieval of complex, multimedia objects, with a primary focus on text documents.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fuhr:1989:OPR, author = "Norbert Fuhr", title = "Optimum Polynomial Retrieval Functions Based on the Probability Ranking Principle", journal = j-TOIS, volume = "7", number = "3", pages = "183--204", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "We show that any approach to developing optimum retrieval functions is based on two kinds of assumptions: first, a certain form of representation for documents and requests, and second, additional simplifying assumptions that predefine the type of the retrieval function. We describe an approach for the development of optimum polynomial retrieval functions. We give experimental results for the application of this approach to documents with weighted indexing as well as to documents with complex representations. In contrast to other probabilistic models, our approach yields estimates of the actual probabilities, it can handle very complex representations of documents and requests, and it can be easily applied to multivalued relevance scales.", acknowledgement = ack-nhfb, affiliation = "Technische Hochschule Darmstadt", affiliationaddress = "Darmstadt, West Ger", classification = "903; 922", conference = "SIGIR Conference on Research and Development in Information Retrieval", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Approximation; Complex Document Representation; Complex document representation; Content analysis and indexing; Indexing methods; Information Retrieval Systems; Information Science --- Information Retrieval; Information search and retrieval; Information storage and retrieval; Least squares approximation; Linear Retrieval Functions; Linear retrieval functions; Multivalued Relevance Scales; Multivalued relevance scales; Numerical analysis; Optimum Retrieval; Probabilistic Indexing; Probabilistic indexing; Probabilistic retrieval; Probability; Probability Ranking Principle; Probability ranking principle; Retrieval methods Experimentation; Theory", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", wwwtitle = "Optimal Polynomial Retrieval Functions Based on the Probability Ranking Principle", } @Article{Raghavan:1989:CIR, author = "Vijay V. Raghavan and Gwang S. Jung and Peter Bollmann", title = "A Critical Investigation of Recall and Precision as Measures of Retrieval System Performance", journal = j-TOIS, volume = "7", number = "3", pages = "205--229", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "Recall and precision are often used to evaluate the effectiveness of information retrieval systems. They are easy to define if there is a single query and if the retrieval result generated for the query is a linear ordering. However, when the retrieval results are weakly ordered, in the sense that several documents have an identical retrieval status value with respect to a query, some probabilistic notion of precision has to be introduced. We systematically investigate the various problems and issues associated with the use of recall and precision as measures of retrieval system performance. Our motivation is to provide a comparative analysis of methods available for defining precision in a probabilistic sense and to promote a better understanding of the various issues involved in retrieval performance evaluation.", acknowledgement = ack-nhfb, affiliation = "Univ of Southwestern Louisiana", affiliationaddress = "Lafayette, LA, USA", classification = "903; 922", conference = "SIGIR Conference on Research and Development in Information Retrieval", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Evaluation measures; Expected precision; Expected Search Length; Expected search length; Experimentation; Fallout; General; Generality; Inf. storage and retrieval; Information Retrieval; Information retrieval; Information Retrieval Systems --- Evaluation; Information Science; Information search and retrieval; Information storage and retrieval; Measurement; Miscellaneous; Performance; Performance measurement; Precision; Probabilistic Notion; Probability; Probability of relevance; Recall; Retrieval models; Retrieval Models; Retrieval System Performance; Stopping criterion; Systems evaluation; Theory", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", } @Article{Klein:1989:STR, author = "Shmuel T. Klein and Abraham Bookstein and Scott Deerwester", title = "Storing Text Retrieval Systems on {CD-ROM}. Compression and Encryption Considerations", journal = j-TOIS, volume = "7", number = "3", pages = "230--245", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "The emergence of the CD-ROM as a storage medium for full-text databases raises the question of the maximum size database that can be contained by this medium. As an example, the problem of storing the Tr{\'e}sor de la Langue Fran{\c{c}}aise on a CD-ROM is examined. Pertinent approaches to compression of the various files are reviewed, and the compression of the text is related to the problem of data encryption: Specifically, it is shown that, under simple models of text generation, Huffman encoding produces a bit-string indistinguishable from a representation of coin flips.", acknowledgement = ack-nhfb, affiliation = "Univ of Chicago", affiliationaddress = "Chicago, IL, USA", classification = "723; 741; 903", conference = "SIGIR Conference on Research and Development in Information Retrieval", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Arts and humanities; Bit-maps; cd-rom; CD-ROM; Coding and information theory; Computer applications; Cryptography; Data; Data encryption; Data Encryption; Data Storage; Full-Text Storage; Full-text storage; Huffman Coding; Huffman coding; Inf. storage and retrieval; Information Retrieval Systems --- Database Systems; Information storage; Information Theory --- Data Compression; Optical; Security; Storage Devices; Text Retrieval Systems", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", wwwtitle = "String Text Retrieval Systems on {CD-ROM}: Compression and Encryption Considerations", } @Article{Smith:1989:KBS, author = "Philip J. Smith and Steven J. Shute and Deb Galdes and Mark H. Chignell", title = "Knowledge-Based Search Tactics for an Intelligent Intermediary System", journal = j-TOIS, volume = "7", number = "3", pages = "246--270", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "Research on the nature of knowledge-based systems for bibliographic information retrieval is summarized. Knowledge-based search tactics are then considered in terms of their role in the functioning of a semantically based search system for bibliographic information retrieval, EP-X. This system uses such tactics to actively assist users in defining or refining their topics of interest. It does so by applying these tactics to a knowledge base describing topics in a particular domain and to a database describing the contents of individual documents in terms of these topics. This paper, then, focuses on the two central concepts behind EP-X: semantically based search and knowledge-based search tactics.", acknowledgement = ack-nhfb, affiliation = "The Ohio State Univ", affiliationaddress = "Columbus, OH, USA", classification = "723; 903", conference = "SIGIR Conference on Research and Development in Information Retrieval", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial Intelligence; Artificial intelligence; Bibliographic Information Retrieval; Bibliographic information retrieval; Database Systems; Document Retrieval; Document retrieval; Frames and scripts; Human factors; Inf. storage and retrieval; Information Retrieval; Information Retrieval Systems --- Computer Aided Analysis; Information Science; Information search and retrieval; Knowledge Representation; Knowledge representation formalisms and methods; Knowledge-Based Search; Knowledge-based search tactics; Knowledge-Based Systems; Knowledge-based systems; Models and principles; Search process; Semantically Based Search; Semantically based search; User/machine systems", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", wwwtitle = "Knowledge-Based Search Tactics for an Intelligent Intermediary", } @Article{Campagnoni:1989:IRU, author = "F. R. Campagnoni and Kate Ehrlich", title = "Information Retrieval Using a Hypertext-Based Help System", journal = j-TOIS, volume = "7", number = "3", pages = "271--291", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "A study was conducted on information retrieval using a commercial hypertext-based help system. It was found that the predominant search strategy was `browsing', rather than employing the indexes. Individuals with better spatial visualization skills were faster at retrieving information than those with poorer spatial visualization skills. These results support previous studies that have found a strong preference by users for browsing in hypertext systems and extend those findings to a new domain (help), a different type of user interface, and a different information architecture.", acknowledgement = ack-nhfb, affiliation = "Sun Microsystems, Inc", affiliationaddress = "Billerica, MA, USA", classification = "723; 903", conference = "SIGIR Conference on Research and Development in Information Retrieval", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer Graphics --- Interactive; Documentation; Graphical User Interfaces; Help Systems; Help systems; Human factors; Hypertext; Individual differences; Inf. storage and retrieval; Information Retrieval; Information Retrieval Systems --- Online Searching; Information Science; Information Search; Information search and retrieval; Models and principles; Search process; Spatial Visualization; User/machine systems; Visualization", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", wwwauthor = "F. R. Campagnoi and K. Ehrlich", } @Article{Metzler:1989:COP, author = "Douglas P. Metzler and Stephanie W. Haas", title = "The Constituent Object Parser: Syntactic Structure Matching for Information Retrieval", journal = j-TOIS, volume = "7", number = "4", pages = "292--316", month = oct, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The Constituent Object Parser is a shallow syntactic parser designed to produce dependency tree representations of syntactic structure that can be used to specify the intended meanings of a sentence more precisely than can the key terms of the sentence alone. It is intended to improve the precision/ recall performance of information retrieval and similar text processing applications by providing more powerful matching procedures. The dependency tree representation and the relationship between the intended use of this parser and its design is described, and several problems concerning the processing and ambiguous structures are discussed.", acknowledgement = ack-nhfb, affiliation = "Univ of Pittsburgh", affiliationaddress = "Pittsburgh, PA, USA", classification = "721; 723; 903", conference = "SIGIR Conference on Research and Development in Information Retrieval", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Automata Theory --- Grammars; Content analysis and indexing; Dependency-based parsing; Design; Inf. storage and retrieval; Information Retrieval; Information Retrieval Systems; Information Science; Information storage and retrieval; Language Parsing; Language parsing and understanding; Linguistic processing; Linguistic Processing; Natural language processing; Natural Language Processing; Precision; Query Formulation; Query formulation; Relevancy judgments; Retrieval models; Search and retrieval; Selection process; Syntactic Structure Matching; Text Analysis; Text analysis", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", } @Article{Olson:1989:WHC, author = "Margrethe H. Olson", title = "Work at Home for Computer Professionals. Current Attitudes and Future Prospects", journal = j-TOIS, volume = "7", number = "4", pages = "317--338", month = oct, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The article reports on two studies of work at home: a quasi-experimental field study of organizational telecommuting pilot programs, and an attitude survey comparing computer professionals who work at home to employees doing similar jobs in traditional office settings. The results of the field study demonstrated that working in the home had little impact on employee performance; however, supervisors were not comfortable with remote workers and preferred their employees to be on site. In the survey, work in the home was related to lower job satisfaction, lower organizational commitment, and higher role conflict. The survey also included computer professionals who worked at home in addition to the regular work day. The author suggests that performing additional unpaid work in the home after regular work hours may be an important trend that merits further investigation. The studies demonstrate that while computer and communications technology have the potential to relax constraints on information work in terms of space and time, in today's traditional work environments, corporate culture and management style limit acceptance of telecommuting as a substitute for office work.", acknowledgement = ack-nhfb, affiliation = "New York Univ", affiliationaddress = "New York, NY, USA", classification = "716; 718; 723; 901; 912", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computers; Computers and society; Computing Profession; Employment; Human factors; Management; Occupations; Office Automation; Organizational impacts; Performance; Personal; Personnel; Social issues; Technology--Economic and Sociological Effects; Telecommunication; Telecommuting; The computing profession", wwwtitle = "Remote Work and Information Technology: Impacts on Organizations and Individuals", } @Article{Afsarmanesh:1989:EOO, author = "Hamideh Afsarmanesh and Dennis McLeod", title = "The {3DIS}: An Extensible, Object-Oriented Information Management Environment", journal = j-TOIS, volume = "7", number = "4", pages = "339--377", month = oct, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The 3-Dimensional Information Space (3DIS) is an extensible object-oriented framework for information management. It is specifically oriented toward supporting the database requirements for data-intensive information system applications in which (1) information objects of various levels of abstraction and modalities must be accommodated, (2) descriptive and structural information (metadata) is rich and dynamic, and (3) users who are not database experts must be able to design, manipulate, and evolve databases. In response to these needs, the 3DIS provides an approach in which data and the descriptive information about data are handled uniformly in an extensible framework. The 3DIS provides a simple, geometric, and formal representation of data which forms a basis for understanding, defining, and manipulating databases. Several prototype implementations based upon the 3DIS have been designed and implemented and are in experimental use.", acknowledgement = ack-nhfb, affiliation = "California State Univ", affiliationaddress = "Carson, CA, USA", classification = "723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Data models; Database management; Database Systems; Design; Extensible database systems; Extensible Database Systems; Information Management; Information systems applications; Knowledge representation; Languages; Logical design; Management; Object-oriented databases; Object-Oriented Databases; Office automation; Office Automation; Office automation systems; Office Information Systems; Schema and subschema; Systems", } @Article{Pernici:1989:CTA, author = "B. Pernici and F. Barbic and M. G. Fugini and R. Maiocchi and J. R. Rames and C. Rolland", title = "{C-TODOS}: An Automatic Tool for Office System Conceptual Design", journal = j-TOIS, volume = "7", number = "4", pages = "378--419", month = oct, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Designers of office information systems, which share various features with information systems and software development, need to carefully consider special issues such as document and communication flows, user roles, user interfaces, and available technology. The ESPRIT Project, Automatic Tools for Designing Office Information Systems (TODOS), proposes an integrated environment for office design with tools for requirements collection and analysis, conceptual design, rapid prototyping, and architecture selection. C-TODOS, the conceptual design support tool developed within TODOS, is presented in this paper. The purpose of C-TODOS is to give the designer tools for supporting conceptual modeling activities with the goal of obtaining correct, consistent, and good quality office-functional specifications. This paper presents C-TODOS within the TODOS development environment and describes the basic features of the tool: the TODOS Conceptual Model, the Specification Database, and the Modeling, Query and Consistency Checking Modules. The use of C-TODOS, through illustration of the development of a test case, and possible future research are discussed.", acknowledgement = ack-nhfb, affiliation = "Politecnico di Milano", affiliationaddress = "Milan, Italy", classification = "723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Analysis and design of systems; C-TODOS; Computer Software--Design; Database management; Design; Design method; Design tool; Documentation; Information Systems; Languages; Logical design; Management of computing and information systems; Methodologies; Office Automation; Office automation systems; Office Information Systems; Query languages; Requirements/specifications; Schema and subschema; Semantic model; Semantic query language; Software development; Software engineering; Software management; Specification database; Tools", } @Article{Lee:1990:PSV, author = "Jintae Lee and Thomas W. Malone", title = "Partially Shared Views: a Scheme for Communicating among Groups that Use Different Type Hierarchies", journal = j-TOIS, volume = "8", number = "1", pages = "1--26", month = jan, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Many computer systems are based on various types of messages, forms, or other objects. When users of such systems need to communicate with people who use different object types, some kind of translation is necessary. In this paper, we explore the space of general solutions to this translation problem and propose a scheme that synthesizes these solutions. A key insight of the analysis is that partially shared type hierarchies allow `foreign' object types to be automatically translated into their nearest common `ancestor' types. The partial interoperability attained in this way makes possible flexible standards from which people can benefit from whatever agreements they do have without having to agree on everything. Even though our examples deal primarily with extension to the Object Lens system, the analysis suggests how other kinds of systems, such as EDI applications, might exploit specialization hierarchies of object types to simplify the translation problem.", acknowledgement = ack-nhfb, affiliation = "Massachusetts Inst of Technology", affiliationaddress = "Cambridge, MA, USA", classification = "722; 723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Applications and expert systems; Artificial intelligence; Communication; Communications applications; Computer Software; Computer Supported Cooperative Work; Computer supported cooperative work; Computer Systems; Data; Design; Digital; Distributed; Distributed systems; Electronic mail; Files; General; Hierarchical systems; Information Lens; Information systems; Information systems applications; Languages; Management; Management of computing and information systems; Modules and interfaces; Object Lens; Object Lens System; Object Types; Office automation; Operating systems; Organization and design; Organization and structure; Partially Shared Views; Partially shared views; Software configuration management; Software engineering; Software libraries; Software management; Standardization; System management; Tools and techniques", wwwtitle = "How Can Groups Communicate when They Use Different Languages", } @Article{Bookstein:1990:CIT, author = "Abraham Bookstein and Shmuel T. Klein", title = "Compression, Information Theory, and Grammars: a Unified Approach", journal = j-TOIS, volume = "8", number = "1", pages = "27--49", month = jan, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We propose the notion of a formal grammar as a flexible model of text generation that encompasses most of the models offered before as well as, in principle, extending the possibility of compression to a much more general class of languages. Assuming a general model of text generation, a derivation is given of the well known Shannon entropy formula, making possible a theory of information based upon text representation rather than on communication. The ideas are shown to apply to a number of commonly used text models. Finally, we focus on a Markov model of text generation, suggest an information theoretic measure of similarity between two probability distributions, and develop a clustering algorithm based on this measure. This algorithm allows us to cluster Markov states and thereby base our compression algorithm on a smaller number of probability distributions than would otherwise have been required. A number of theoretical consequences of this approach to compression are explored, and a detailed example is given.", acknowledgement = ack-nhfb, affiliation = "Univ of Chicago", affiliationaddress = "Chicago, IL, USA", classification = "721; 723; 922", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Artificial intelligence; Automata Theory--Grammars; Codes; Coding and information theory; Computer Programming--Algorithms; Data; Data compaction and compression; Data Compression; Huffman coding; Huffman Coding; Information storage; Information storage and retrieval; Information theory; Information Theory; Language Generation; Markov model of language generation; Markov Models; Models and principles; Natural language processing; Probability--Random Processes; Symbolic--Encoding; Systems and information theory; Theory", } @Article{Hammainen:1990:DFM, author = "Heikki Hammainen and Eero Eloranta and Jari Alasuvanto", title = "Distributed Form Management", journal = j-TOIS, volume = "8", number = "1", pages = "50--76", month = jan, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "An open architecture for distributed form management is described. The model employs object-orientation in describing organizational units as well as individual users as entities with uniform external interfaces. Each entity is represented by an autonomous user agent which operates on local and migrating forms. The form concept encapsulates data, layout, and rules into a unified object which is the basic unit of presentation, processing, storage, and communication. All functionality of the system appears in rules of form classes and all data in instances of these form classes. This approach applies the techniques of computer supported cooperative work to provide a flexible mechanism for interpersonal, intraoffice, and interoffice procedures. The main challenge is to organize the collaboration without affecting the autonomy of individual user agents. In this respect, the contribution of the model is the mechanism for form migration. The dynamic integration of forms into different agents is solved with the coordinated interchange of form classes. A specific inheritance scheme provides the desired flexibility by separating the interrelated private and public form operations within each agent. The paper first describes the architecture by starting from a single agent and moving progressively towards a set of cooperating agents. Then an agent implementation called PAGES is described, experiences reported, and the open issues discussed. A typical distributed ordering procedure is used as an example throughout the text.", acknowledgement = ack-nhfb, affiliation = "Helsinki Univ of Technology", affiliationaddress = "Espoo, Finl", classification = "723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Communications applications; Computer Architecture; Computer Supported Cooperative Work; Computer supported cooperative work; Computer Systems; Computer-communication networks; Database management; Digital--Distributed; Distr. applications; Distr. systems; Distributed Form Management; Electronic mail; Form Management; Form management; Human factors; Information systems applications; Management; Object-orientation; Office automation; Office Automation; Performance; Systems; User agent", } @Article{Watters:1990:THB, author = "Carolyn Watters and Michael A. Shepherd", title = "A Transient Hypergraph-based Model for Data Access", journal = j-TOIS, volume = "8", number = "2", pages = "77--102", month = apr, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Two major methods of accessing data in current database systems are querying and browsing. The more traditional query method returns an answer set that may consist of data values (DBMS), items containing the answer (full text), or items referring the user to items containing the answer (bibliographic). Browsing within a database, as best exemplified by hypertext systems, consists of viewing a database item and linking to related items on the basis of some attribute or attribute value. A model of data access has been developed that supports both query and browse access methods. The model is based on hypergraph representation of data instances. The hyperedges and nodes are manipulated through a set of operators to compose new nodes and to instantiate new links dynamically, resulting in transient hypergraphs. These transient hypergraphs are virtual structures created in response to user queries, and lasting only as long as the query session. The model provides a framework for general data access that accommodates user-directed browsing and querying, as well as traditional models of information and data retrieval, such as the Boolean, vector space, and probabilistic models. Finally, the relational database model is shown to provide a reasonable platform for the implementation of this transient hypergraph-based model of data access.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Data access model; Data items; Data manipulation; Data models; Data structures; Database management; Design; Hypertext; Inf. storage and retrieval; Information storage; Logic design; Transient hypergraphs; Virtual structures", wwwauthor = "C. Watters and M. A. Sheperd", } @Article{Moss:1990:DMP, author = "J. Eliot B. Moss", title = "Design of the {Mneme} Persistent Object Store", journal = j-TOIS, volume = "8", number = "2", pages = "103--139", month = apr, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", wwwtitle = "Design of the Mmeme Persistent Object Store", } @Article{Shasha:1990:NTB, author = "Dennis Shasha and Tsong-Li Wang", title = "New Techniques for Best-Match Retrieval", journal = j-TOIS, volume = "8", number = "2", pages = "140--158", month = apr, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "A scheme to answer best-match queries from a file containing a collection of objects is described. A best-match query is to find the objects in the file that are closest (according to some (dis)similarity measure) to a given target. Previous work [5, 33] suggests that one can reduce the number of comparisons required to achieve the desired results using the triangle inequality, starting with a data structure for the file that reflects some precomputed intrafile distances. We generalize the technique to allow the optimum use of any given set of precomputed intrafile distances. Some empirical results are presented which illustrate the effectiveness of our scheme, and its performance relative to previous algorithms.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Algorithms; Analysis of algorithms and problem complexity; Artificial intelligence; Best match; Database management; Distance metrics; File searching; Heuristics; Information search and retrieval; Information storage and retrieval; Lower bounds; Matching; Miscellaneous; Nonnumerical algorithms and problems; Performance; Query processing; Search process; Sorting and searching; Systems; Theory; Topology; Upper bounds", } @Article{Morrissey:1990:IIU, author = "J. M. Morrissey", title = "Imprecise Information and Uncertainty in Information Systems", journal = j-TOIS, volume = "8", number = "2", pages = "159--180", month = apr, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Information systems exist to model, store, and retrieve all types of data. Problems arise when some of the data are missing or imprecisely known or when an attribute is not applicable to a particular object. A consistent and useful treatment of such exceptions is necessary. The approach taken here is to allow any attribute value to be a regular precise value, a string denoting that the value is missing, a string denoting that the attribute is not applicable, or an imprecise value. The imprecise values introduce uncertainty into query evaluation, since it is no longer obvious which objects should be retrieved. To handle the uncertainty, two set of objects are retrieved in response to every query: the set of objects that are known to satisfy with complete certainty and the set that possibly satisfies the query with various degrees of uncertainty. Two methods of estimating this uncertainty, based on information theory, are proposed. The measure of uncertainty is used to rank objects for presentation to a user.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Database management; Design; Incomplete information; Inf. theory; Management; Models and principles; Null values; Query evaluation; Query processing; Sys. and information theory; Systems; Uncertainty", } @Article{Hartson:1990:UUO, author = "H. Rex Hartson and Antonio C. Siochi and Deborah Hix", title = "The {UAN}: a User-Oriented Representation for Direct Manipulation Interface Designs", journal = j-TOIS, volume = "8", number = "3", pages = "181--203", month = jul, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Many existing interface representation techniques, especially those associated with UIMS, are constructional and focused on interface implementation, and therefore do not adequately support a user-centered focus. But it is in the behavioral domain of the user that interface designers and evaluators do their work. We are seeking to complement constructional methods by providing a tool-supported technique capable of specifying the behavioral aspects of an interactive system-the tasks and the actions a user performs to accomplish those tasks. In particular, this paper is a practical introduction to use of the User Action Notation (UAN), a task- and user-oriented notation for behavioral representation of asynchronous, direct manipulation interface designs. Interfaces are specified in UAN as a quasihierarchy of asynchronous tasks. At the lower levels, user actions are associated with feedback and system state changes. The notation makes use of visually onomatopoeic symbols and is simple enough to read with little instruction. UAN is being used by growing numbers of interface developers and researchers. In addition to its design role, current research is investigating how UAN can support production and maintenance of code and documentation.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Behavioral design; Constructional design; Design; Human factors; Human-computer interface; Languages; Representation; Representation of interfaces; Requirements/specifications; Software engineering; Task analysis; Tools and techniques; User interface; User interfaces", } @Article{Wiecha:1990:TRD, author = "Charles Wiecha and William Bennett and Stephen Boies and John Gould and Sharon Greene", title = "{ITS}: a Tool for Rapidly Developing Interactive Applications", journal = j-TOIS, volume = "8", number = "3", pages = "204--236", month = jul, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The ITS architecture separates applications into four layers. The action layer implements back-end application functions. The dialog layer defines the content of the user interface, independent of its style. Content specifies the objects included in each frame of the interface, the flow of control among frames, and what actions are associated with each object. The style rule layer defines the presentation and behavior of a family of interaction techniques. Finally, the style program layer implements primitive toolkit objects that are composed by the rule layer into complete interaction techniques. This paper describes the architecture in detail, compares it with previous User Interface Management Systems and toolkits, and describes how ITS is being used to implement the visitor information system for EXPO'92.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Computer graphics; Design; Device independence; Ergonomics; General; Human factors; Information systems applications; Interaction techniques; Languages; Management; Management of computing and information systems; Management systems; Methodology and techniques; Models and principles; Project and people management; Software development; Software engineering; Software libraries; Software maintenance; Software management; Standardization; Systems analysis and design; Systems development; Tools and techniques; User interface; User interfaces; User/machine systems", } @Article{Vlissides:1990:UFB, author = "John M. Vlissides and Mark A. Linton", title = "{Unidraw}: a Framework for Building Domain-Specific Graphical Editors", journal = j-TOIS, volume = "8", number = "3", pages = "237--268", month = jul, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Unidraw is a framework for creating graphical editors in domains such as technical and artistic drawing, music composition, and circuit design. The Unidraw architecture simplifies the construction of these editors by providing programming abstractions that are common across domains. Unidraw defines four basic abstractions: components encapsulate the appearance and behavior of objects, tools support direct manipulation of components, commands define operations on components, and external representations define the mapping between components and the file format generated by the editor. Unidraw also supports multiple views, graphical connectivity, and dataflow between components. This paper describes the Unidraw design, implementation issues, and three experimental domain-specific editors we have developed with Unidraw: a drawing editor, a user interface builder, and a schematic capture system. Our results indicate a substantial reduction in implementation time and effort compared with existing tools.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Application packages; Computer applications; Computer graphics; Computer-aided design (CAD); Computer-aided engineering; Design; Direct manipulation user interfaces; Graphical constraints; Graphics utilities; Human factors; Object-oriented graphical editors; Software engineering; Software libraries; Tools and techniques; User interfaces", } @Article{Hudson:1990:ISF, author = "Scott E. Hudson and Shamim P. Mohamed", title = "Interactive Specification of Flexible User Interface Displays", journal = j-TOIS, volume = "8", number = "3", pages = "269--288", month = jul, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "One of the problems with conventional UIMSs is that very often there is no graphical way to specify interfaces. This paper describes OPUS, the user interface editor of the Penguims UIMS. This system allows the presentation component of graphical user interfaces to be specified interactively in a graphical notation without explicit programming. The Penguims UIMS supports an underlying model of computation based loosely on spreadsheets. In particular, it supports incremental computations based on a system of equations (one-way constraints) over a set of named values (spreadsheet cells). These equations are used to provide immediate feedback at all levels of the interface. They are used to incrementally determine the position and dynamic appearance of the individual interactor objects that make up the interface. They are also used to connect the presentation directly to underlying application data thereby supporting semantic feedback. The OPUS user interface editor employs a special graphical notation for specifying the presentation component of a user interface. This notation allows the power of the underlying computational model to be expressed simply and quickly. The resulting presentations are very flexible in nature. They can automatically respond to changes in the size and position of display objects and can directly support derivation of their appearance from application data objects.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Computer graphics; Constraint systems; Direct manipulation; End-user programming; Human factors; Interactive; Interface builders; Languages; Methodology and techniques; Miscellaneous; Programming environments; Rapid prototyping; Software engineering; Tools and techniques; User interface management systems; User interfaces", } @Article{Myers:1990:NMH, author = "Brad A. Myers", title = "A New Model for Handling Input", journal = j-TOIS, volume = "8", number = "3", pages = "289--320", month = jul, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Although there has been important progress in models and packages for the output of graphics to computer screens, there has been little change in the way that input from the mouse, keyboard, and other input devices is handled. New graphics standards are still using a fifteen-year-old model even though it is widely accepted as inadequate, and most modern window managers simply return a stream of low-level, device-dependent input events. This paper presents a new model that handles input devices for highly interactive, direct manipulation, graphical user interfaces, which could be used in future toolkits, window managers, and graphics standards. This model encapsulates interactive behaviors into a few ``Interactor'' object types. Application programs can then create instances of these Interactor objects which hide the details of the underlying window manager events. In addition, Interactors allow a clean separation between the input handling, the graphics, and the application programs. This model has been extensively used as part of the Garnet system and has proven to be convenient, efficient, and easy to learn.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Computer graphics; Direct manipulation; Human factors; Input devices; Interaction; Interaction techniques; Methodology and techniques; Model-view controller; Object-oriented design; Software engineering; Tools and techniques; User interface management systems; User interfaces", } @Article{Mylopoulos:1990:TRK, author = "John Mylopoulos and Alex Borgida and Matthias Jarke and Manolis Koubarakis", title = "Telos: Representing Knowledge About Information Systems", journal = j-TOIS, volume = "8", number = "4", pages = "325--362", month = oct, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We describe Telos, a language intended to support the development of information systems. The design principles for the language are based on the premise that information system development is knowledge intensive and that the primary responsibility of any language intended for the task is to be able to formally represent the relevant knowledge. Accordingly, the proposed language is founded on concepts from knowledge representation. Indeed, the language is appropriate for representing knowledge about a variety of worlds related to an information system, such as the subject world (application domain), the usage world (user models, environments), the system world (software requirements, design), and the development world (teams, methodologies). We introduce the features of the language through examples, focusing on those provided for describing metaconcepts that can then be used to describe knowledge relevant to a particular information system. Telos' features include an object-centered framework which supports aggregation, generalization, and classification; a novel treatment of attributes; an explicit representation of time; and facilities for specifying integrity constraints and deductive rules. We review actual applications of the language through further examples, and we sketch a formalization of the language.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Artificial intelligence; Belief time; Class; Deductive rules; Design; General; History time; Instance; Integrity constraints; Knowledge base; Knowledge representation formalisms and methods; Languages; Management of computing and information systems; Metaclass; Methodologies; Models and principles; Predicate logic; Proposition; Representation; Representation languages; Requirements/specifications; Semantic networks; Software development; Software engineering; Software management; Temporal knowledge", wwwpages = "363--386", wwwtitle = "{Telos}: a Language for Representing Knowledge About Information Systems", } @Article{Kwok:1990:ECT, author = "K. L. Kwok", title = "Experiments with a Component Theory of Probabilistic Information Retrieval Based on Single Terms as Document Components", journal = j-TOIS, volume = "8", number = "4", pages = "363--386", month = oct, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "A component theory of information retrieval using single content terms as component for queries and documents was reviewed and experimented with. The theory has the advantages of being able to (1) bootstrap itself, that is, define initial term weights naturally based on the fact that items are self-relevant; (2) make use of within-item term frequencies; (3) account for query-focused and document-focused indexing and retrieval strategies cooperatively; and (4) allow for component-specific feedback if such information is available. Retrieval results with four collections support the effectiveness of all the first three aspects, except for predictive retrieval. At the initial indexing stage, the retrieval theory performed much more consistently across collections than Croft's model and provided results comparable to Salton's tf*idf approach. An inverse collection term frequency (ICTF) formula was also tested that performed much better than the inverse document frequency (IDF). With full feedback retrospective retrieval, the component theory performed substantially better than Croft's, because of the highly specific nature of document-focused feedback. Repetitive retrieval results with partial relevance feedback mirrored those for the retrospective. However, for the important case of predictive retrieval using residual ranking, results were not unequivocal.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Content analysis and indexing; Document-focused and query-focused relevance feedback; Experimentation; Indexing and retrieval; Indexing methods; Inf. storage and retrieval; Information search and retrieval; Information storage and retrieval; Inverse collection term frequency weighting; Inverse document frequency weighting; Probabilistic indexing; Probabilistic retrieval; Ranking and weighting of composite objects; Retrieval models; Theory", wwwpages = "325-362", } @Article{Straube:1990:QQP, author = "Dave D. Straube and M. Tamer {\"O}zsu", title = "Queries and Query Processing in Object-Oriented Database Systems", journal = j-TOIS, volume = "8", number = "4", pages = "387--430", month = oct, year = "1990", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Object-oriented database management systems (OODBMS) combine the data abstraction and computational models of object-oriented programming languages with the query and performance capabilities of database management systems. A concise, formal data model for OODBMS has not been universally accepted, preventing detailed investigation of various system issues such as query processing. We define a data model that captures the essence of classification-based object-oriented systems and formalize concepts such as object identity, inheritance, and methods. The main topic of the paper is the presentation of a query processing methodology complete with an object calculus and a closed object algebra. Query processing issues such as query safety and object calculus to object algebra translation are discussed in detail. The paper concludes with a discussion of equivalence-preserving transformation rules for object algebra expressions.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Abstract data types; Algorithms; Data models; Data types and structures; Database management; Design; Language constructs; Languages; Logical design; Modules and packages; Object algebra; Object calculus; Object-oriented databases; Programming languages; Query languages; Query processing; Query transformation rules; Systems", wwwauthor = "D. D. Straube and M. T. Ozsu", wwwpages = "387-428", wwwtitle = "Queriers and Query Processing in Object-Oriented Database Systems", } @Article{Ford:1991:OPH, author = "Daniel Alexander Ford and Stavros Christodoulakis", title = "Optimal Placement of High Probability Randomly Retrieved Blocks on {CLV} Optical Discs", journal = j-TOIS, volume = "9", number = "1", pages = "1--30", month = jan, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Optimal data placement on a CLV (Constant Linear Velocity) format optical disc has as an objective the minimization of the expected access cost of data retrieval from the disc when the probabilities of access of data items may be different. The problem of optimal data placement for optical discs is both more important and more difficult than the corresponding problem on magnetic disks. A good data placement on optical discs is more important because data sets on optical discs such as WORM and CD ROM cannot be modified or moved once they are placed on the disc. Currently, even rewritable optical discs are best suited for applications that are archival in nature. The problem of optimal data placement on CLV format optical discs is more difficult, mainly because the useful storage space is not uniformly distributed across the disc surface (along a radius). This leads to a complicated positional performance trade-off not present for magnetic disks. We present a model that encompasses all the important aspects of the placement problem on CLV format optical discs. The model takes into account the nonuniform distribution of useful storage, the dependency of the rotational delay on disc position, a parameterized seek cost function for optical discs, and the varying access probabilities of data items. We show that the optimal placement of high-probability blocks satisfies a unimodality property. Based on this observation, we solve the optimal placement problem. We then study the impact of the relative weights of the problem parameters and show that the optimal data placement may be very different from the optimal data placement on magnetic disks. We also validate our model and analysis and give an algorithm for computing the placement of disc sectors.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Access methods; CD-ROM; Clustering; CLV; Constant linear velocity; Data placement; Database management; Design; Design styles; Information search and retrieval; Information storage and retrieval; Management; Mass storage; MCAV; MCLV; Memory structures; Operating systems; Optical discs; Optical disks; Performance; Physical database design; Physical design; Retrieval performance; Secondary storage devices; Storage management", wwwauthor = "S. Christodoulakis and D. A. Ford", } @Article{Kim:1991:DOO, author = "Won Kim and Nat Ballou and Jorge F. Garza and Darrell Woelk", title = "A Distributed Object-Oriented Database System Supporting Shared and Private Databases", journal = j-TOIS, volume = "9", number = "1", pages = "31--51", month = jan, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "ORION-2 is a commercially available, federated, object-oriented database management system designed and implemented at MCC. One major architectural innovation in ORION-2 is the coexistence of a shared database and a number of private databases. The shared database is accessible to all authorized users of the system, while each private database is accessible to only the user who owns it. A distributed database system with a shared database and private databases for individual users is a natural architecture for data-intensive application environments on a network of workstations, notably computer-aided design and engineering systems. This paper discusses the benefits and limitations of such a system and explores the impact of such an architecture on the semantics and implementation of some of the key functions of a database system, notably queries, database schema, and versions. Although the issues are discussed in the context of an object-oriented data model, the results (at least significant portions thereof) are applicable to database systems supporting other data models.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Client-server architecture; Database management; Design; Distr. systems; Experimentation; Federated databases; Object-oriented databases; Sys.", wwwauthor = "W. Kim and N. Ballou and J. F. Garza and D. Woelk", } @Article{Mak:1991:EPP, author = "Victor Wing-Kit Mak and Chu Lee Kuo and Ophir Frieder", title = "Exploiting Parallelism in Pattern Matching: An Information Retrieval Application", journal = j-TOIS, volume = "9", number = "1", pages = "52--74", month = jan, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We propose a document-searching architecture based on high-speed hardware pattern matching to increase the throughput of an information retrieval system. We also propose a new parallel VLSI pattern-matching algorithm called the Data Parallel Pattern Matching (DPPM) algorithm, which serially broadcasts and compares the pattern to a block of data in parallel. The DPPM algorithm utilizes the high degree of integration of VLSI technology to attain very high-speed processing through parallelism. Performance of the DPPM has been evaluated both analytically and by simulation. Based on the simulation statistics and timing analysis on the hardware design, a search rate of multiple gigabytes per second is achievable using 2-$\lbrace$micro$\rbrace$m CMOS technology. The potential performance of the proposed document-searching architecture is also analyzed using the simulation statistics of the DPPM algorithm.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Algorithms; Algorithms implemented in hardware; Analysis of algorithms and problem complexity; Arithmetic and logic structures; Computer systems organization; Data; Design; Design studies; Design styles; DPPM; Files; Information search and retrieval; Information storage and retrieval; Integrated circuits; Modeling techniques; Multiple data stream architecture; Nonnumerical algorithms and problems; Parallel; Pattern matcher; Pattern matching; Performance; Performance of systems; Processor architectures; Search process; Selection process; SIMD; Sorting and searching; Sorting/searching; Types and design styles; VLSI", } @Article{Aiken:1991:IES, author = "Milam W. Aiken and Olivia R. Liu Sheng and Douglas R. Vogel", title = "Integrating Expert Systems With Group Decision Support Systems", journal = j-TOIS, volume = "9", number = "1", pages = "75--95", month = jan, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Expert systems are powerful tools that serve as adjuncts to decision making and have found wide applicability in a variety of areas. Integrating expert systems with group decision support systems has the potential to enhance the quality and efficiency of group communication, negotiation, and collaborative work. This paper examines possible synergies between the two technologies and provides a survey of current partially-integrated systems. Finally, a prototype design of a highly-integrated system is described with directions for further research.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Applications and expert systems; Artificial intelligence; Communications applications; Expert systems; Group decision support systems; Inf. systems applications; Knowledge-based systems", } @Article{Allen:1991:ECH, author = "Robert B. Allen", title = "Editorial: Computer-Human Interaction and {ACM TOIS}", journal = j-TOIS, volume = "9", number = "2", pages = "97--98", month = apr, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Human Interaction.", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Card:1991:MAD, author = "Stuart K. Card and Jock D. Mackinlay and George G. Robertson", title = "A Morphological Analysis of the Design Space of Input Devices", journal = j-TOIS, volume = "9", number = "2", pages = "99--122", month = apr, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Human Interaction.", URL = "http://www.acm.org:80", abstract = "The market now contains a bewildering variety of input devices for communication from humans to computers. This paper discusses a means to systematize these devices through morphological design space analysis, in which different input device designs are taken as points in a parametrically described design space. The design space is characterized by finding methods to generate and test design points. In a previous paper, we discussed a method for generating the space of input device designs using primitive and compositional movement operators. This allowed us to propose a taxonomy of input devices. In this paper, we summarize the generation method and explore the use of device footprint and Fitts's law as a test. We then use calculations to reason about the design space. Calculations are used to show why the mouse is a more effective device than the headmouse and where in the design space there is likely to be a more effective device than the mouse.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Computer applications; Computer-aided design; Computer-aided engineering; Design; Design knowledge systematization; Design rationale; Design space; Human factors; Input devices; Models and principles; Morphological analysis; Semantics; User/machine systems", wwwtitle = "The Design Space of Input Devices", } @Article{Fischer:1991:RCC, author = "Gerhard Fischer and Andreas C. Lemke and Thomas Mastaglio and Anders I. Morch", title = "The Role of Critiquing in Cooperative Problem Solving", journal = j-TOIS, volume = "9", number = "2", pages = "123--151", month = apr, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Human Interaction.", URL = "http://www.acm.org:80", abstract = "Cooperative problem-solving systems help users design solutions themselves as opposed to having solutions designed for them. Critiquing -- presenting a reasoned opinion about a user's product or action -- is a major activity of a cooperative problem-solving system. Critics make the constructed artifact ``talk back'' to the user. Conditions under which critics are more appropriate than autonomous expert systems are discussed. Critics should be embedded in integrated design environments along with other components, such as an argumentative hypertext system, a specification component, and a catalog. Critics support learning as a by-product of problem solving. The major subprocesses of critiquing are goal acquisition, product analysis, critiquing strategies, adaptation capability, explanation and argumentation, and advisory capability. The generality of the critiquing approach is demonstrated by discussing critiquing systems developed in our group and elsewhere. Limitations of many current critics include their inability to learn about specific user goals and their intervention strategies.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Computer applications; Computer uses in education; Computer-aided design; Computer-aided engineering; Computers and education; Cooperative problem-solving systems; Critics; Critiquing; Design; Design environments; High-functionality computer systems; Human factors; Inf. storage and retrieval; Information search and retrieval; Intelligent support systems; Models and principles; User/machine systems", } @Article{Jacob:1991:UEM, author = "Robert J. K. Jacob", title = "The Use of Eye Movements in Human-Computer Interaction Techniques: What You Look At Is What You Get", journal = j-TOIS, volume = "9", number = "2", pages = "152--169", month = apr, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Human Interaction.", URL = "http://www.acm.org:80", abstract = "In seeking hitherto-unused methods by which users and computers can communicate, we investigate the usefulness of eye movements as a fast and convenient auxiliary user-to-computer communication mode. The barrier to exploiting this medium has not been eye-tracking technology but the study of interaction techniques that incorporate eye movements into the user-computer dialogue in a natural and unobtrusive way. This paper discusses some of the human factors and technical considerations that arise in trying to use eye movements as an input medium, describes our approach and the first eye movement-based interaction techniques that we have devised and implemented in our laboratory, and reports our experiences and observations on them.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Design; Eye movements; Eye tracking; Human factors; Human-computer interaction; Information interfaces and presentation; Input; Input devices and strategies; Interaction styles; Models and principles; Software engineering; State transition diagram; Tools and techniques; UIMS; User interface management system; User interfaces; User/machine systems", } @Article{Tang:1991:VVI, author = "John C. Tang and Scott L. Minneman", title = "{VideoDraw}: a Video Interface for Collaborative Drawing", journal = j-TOIS, volume = "9", number = "2", pages = "170--184", month = apr, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Human Interaction.", URL = "http://www.acm.org:80", abstract = "This paper describes VideoDraw, a shared drawing tool, and the process by which it is being designed and developed. VideoDraw is a video-based prototype tool that provides a shared ``virtual sketchbook'' among two or more collaborators. It not only allows the collaborators to see each others' drawings, but also conveys the accompanying hand gestures and the process of creating and using those drawings. Its design stems from studying how people collaborate using shared drawing spaces. Design implications raised by those studies were embodied in a prototype, which was subsequently observed in use situations. Further research studying the use of VideoDraw (in comparison with other collaborative media) will lead to a better understanding of collaborative drawing activity and inform the continued technical development of tools to support collaborative drawing.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Collaborative systems; Communications applications; Computer graphics; Computer-communication networks; Design; Distr. applications; Distr. systems; Distributed/network graphics; Gestural interfaces; Graphics systems; Information systems applications; Shared drawing; Teleconferencing; User interface; Video technology; Work practice analysis", } @Article{Croft:1991:E, author = "W. Bruce Croft", title = "Editorial", journal = j-TOIS, volume = "9", number = "3", pages = "185--186", month = jul, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Turtle:1991:EIN, author = "Howard Turtle and W. Bruce Croft", title = "Evaluation of an Inference Network=based Retrieval Model", journal = j-TOIS, volume = "9", number = "3", pages = "187--222", month = jul, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "The use of inference networks to support document retrieval is introduced. A network-based retrieval model is described and compared to conventional probabilistic and Boolean models. The performance of a retrieval system based on the inference network model is evaluated and compared to performance with conventional retrieval models.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Document retrieval; Experimentation; General; Inf. storage and retrieval; Inference networks; Information search and retrieval; Information storage and retrieval; Miscellaneous; Network retrieval models; Performance; Retrieval models; Theory", } @Article{Fuhr:1991:PLA, author = "Norbert Fuhr and Chris Buckley", title = "A Probabilistic Learning Approach for Document Indexing", journal = j-TOIS, volume = "9", number = "3", pages = "223--248", month = jul, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "We describe a method for probabilistic document indexing using relevance feedback data that has been collected from a set of queries. Our approach is based on three new concepts: (1) Abstraction from specific terms and documents, which overcomes the restriction of limited relevance information for parameter estimation. (2) Flexibility of the representation, which allows the integration of new text analysis and knowledge-based methods in our approach as well as the consideration of document structures or different types of terms. (3) Probabilistic learning or classification methods for the estimation of the indexing weights making better use of the available relevance information. Our approach can be applied under restrictions that hold for real applications. We give experimental results for five test collections which show improvements over other methods.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Approximation; Artificial intelligence; Complex document representation; Content analysis and indexing; Experimentation; Indexing methods; Information search and retrieval; Information storage and retrieval; Learning; Least squares approximation; Linear indexing functions; Linear retrieval functions; Numerical analysis; Parameter learning; Probabilistic indexing; Probabilistic retrieval; Relevance descriptions; Retrieval models; Theory", } @Article{Gauch:1991:SIA, author = "Susan Gauch and John B. Smith", title = "Search Improvement via Automatic Query Reformulation", journal = j-TOIS, volume = "9", number = "3", pages = "249--280", month = jul, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "Users of online retrieval systems experience many difficulties, particularly with search tactics. User studies have indicated that searchers use vocabulary incorrectly and do not take full advantage of iteration to improve their queries. To address these problems, an expert system for online search assistance was developed. This prototype augments the searching capabilities of novice users by providing automatic query reformulation to improve the search results, and automatic ranking of the retrieved passages to speed the identification of relevant information. Users' search performance using the expert system was compared with their search performance on their own, and their search performance using an online thesaurus. The following conclusions were reached: (1) the expert system significantly reduced the number of queries necessary to find relevant passages compared with the user searching alone or with the thesaurus. (2) The expert system produced marginally significant improvements in precision compared with the user searching on their own. There was no significant difference in the recall achieved by the three system configurations. (3) Overall, the expert system ranked relevant passages above irrelevant passages.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Applications and expert systems; Artificial intelligence; Expert systems; Full-text information retrieval; Human factors; Inf. storage and retrieval; Information search and retrieval; Models and principles; Online search assistance; Query reformulation; Search process; Textbases; User/machine system", } @Article{Fox:1991:OPM, author = "Edward A. Fox and Qi Fan Chen and Amjad M. Daoud and Lenwood S. Heath", title = "Order Preserving Minimal Perfect Hash Functions and Information Retrieval", journal = j-TOIS, volume = "9", number = "3", pages = "281--308", month = jul, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Research and Development in Information Retrieval.", URL = "http://www.acm.org:80", abstract = "Rapid access to information is essential for a wide variety of retrieval systems and applications. Hashing has long been used when the fastest possible direct search is desired, but is generally not appropriate when sequential or range searches are also required. This paper describes a hashing method, developed for collections that are relatively static, that supports both direct and sequential access. The algorithms described give hash functions that are optimal in terms of time and hash table space utilization, and that preserve any a priori ordering desired. Furthermore, the resulting order-preserving minimal perfect hash functions (OPMPHFs) can be found using time and space that are linear in the number of keys involved; this is close to optimal.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Access methods; Algorithms; Content analysis and indexing; Data; Data storage representations; Database management; Dictionary structure; Experimentation; File organization; Hash table representations; Indexing; Indexing methods; Information storage; Information storage and retrieval; Inverted file structures; Minimal perfect hashing; Perfect hashing; Physical design; Random graph", } @Article{Siochi:1991:CAU, author = "Antonio C. Siochi and Roger W. Ehrich", title = "Computer Analysis of User Interfaces Based on Repetition in Transcripts of User Sessions", journal = j-TOIS, volume = "9", number = "4", pages = "309--335", month = oct, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "It is generally acknowledged that the production of quality user interfaces requires a thorough understanding of the user and that this involves evaluating the interface by observing the user working with the system, or by performing human factors experiments. Such methods traditionally involve the use of videotape, protocol analysis, critical incident analysis, etc. These methods require time consuming analyses and may be invasive. In addition, the data obtained through such methods represent a relatively small portion of the use of a system. An alternative approach is to record all user input and system output (i.e., log the user session). Such transcripts can be collected automatically and noninvasively over a long period of time. Unfortunately this produces voluminous amounts of data. There is therefore a need for tools and techniques that allow an evaluator to identify potential performance and usability problems from such data. It is hypothesized that repetition of user actions is an important indicator of potential user interface problems. This research reports on the use of the repetition indicator as a means of studying user session transcripts in the evaluation of user interfaces. The paper discusses the interactive tool constructed, the results of an extensive application of the technique in the evaluation of a large image-processing system, and extensions and refinements to the technique. Evidence suggests that the hypothesis is justified and that such a technique is convincingly useful.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Evaluation/methodology; Human factors; Inf. interfaces and presentation; Maximal repeating patterns; Measurement; Repeated usage patterns; Software engineering; Tools and techniques; Transcript analysis; Usability; User interface evaluation; User interface management systems; User interfaces", } @Article{Zezula:1991:DPS, author = "P. Zezula and F. Rabitti and P. Tiberio", title = "Dynamic Partitioning of Signature Files", journal = j-TOIS, volume = "9", number = "4", pages = "336--369", month = oct, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The signature file access method has proved to be a convenient indexing technique, in particular for text data. Because it can deal with unformatted data, many application domains have shown interest in signature file techniques, e.g., office information systems, statistical and logic databases. We argue that multimedia databases should also take advantage of this method, provided convenient storage structures for organizing signature files are available. Our main concern here is the dynamic organization of signatures based on a partitioning paradigm called Quick Filter. A signature file is partitioned by a hashing function and the partitions are organized by linear hashing. Thorough performance evaluation of the new scheme is provided, and it is compared with single-level and multilevel storage structures. Results show that quick filter is economical in space and very convenient for applications dealing with large files of dynamic data, and where user queries result in signatures with high weights. These characteristics are particularly interesting for multimedia databases, where integrated access to attributes, text and images must be provided.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Access methods; Data; Database management; Design; Dynamic data; File organization; Files; Hashing; Information retrieval; Information storage; Information storage and retrieval; Information systems applications; Multimedia data; Office automation; Organization / structure; Performance; Performance evaluation; Physical design; Signature file partitioning", } @Article{Hart:1991:ION, author = "Paul Hart and Deborah Estrin", title = "Inter-Organization Networks, Computer Integration, and Shifts in Interdependence: The Case of the Semiconductor Industry", journal = j-TOIS, volume = "9", number = "4", pages = "370--398", month = oct, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Inter-organization computer networks (IONs) provide significant opportunities for improving coordination between firms engaged in mutually dependent activities. A field study of the use and impact of IONs in the semiconductor industry is presented in this paper. Eighty-two interviews were conducted in twelve firms (seven semiconductor producers and five merchant mask shops) providing data on current as well as anticipated ION use. We found that greater efficiencies are possible when IONs are used as substitutes for conventional media. But more effective ION use is achievable when internal computer integration within participating firms is implemented. The implication of this otherwise straightforward observation is that firms using computer networks only as a substitute for conventional methods of exchange will not achieve the degree of inter-organization coordination IONs can support. However, while IONs improve coordination and reduce some production and transaction costs, they simultaneously increase certain costs associated with establishing and maintaining contracts with customers. These costs are new dependencies. Dependencies emerge from using IONs to access computer resources, and information generated by those resources, located in other firms. In this way IONs increase interorganization coordination and vulnerability simultaneously. The long term implication of ION adoption is that their use shifts the nature of interdependence between participating firms.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Communications applications; Computer applications; Computer integration; Computer system implementation; Computer-communication networks; Computers and society; Computers in other systems; Consumer products; Electronic mail; Gate arrays; Information systems applications; Integrated circuits; Inter-organization computer networks; Inter-organization relationships; Management; Management of computing and information systems; Miscellaneous; Network management; Network operations; Organizational impacts; Performance; Project and people management; Standard cells; Systems development; Types and design styles", wwwpages = "399-419", wwwtitle = "Inter-Organization Networks, Computer Integration, Shift in Interdependence: The Case of the Semiconductor Industry", } @Article{Kacmar:1991:PPO, author = "Charles J. Kacmar and John J. Leggett", title = "{PROXHY}: a Process-Oriented Extensible Hypertext Architecture", journal = j-TOIS, volume = "9", number = "4", pages = "399--419", month = oct, year = "1991", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "ftp://ftp.ira.uka.de/pub/bibliography/Database/Graefe.bib; http://liinwww.ira.uka.de/bibliography/Database/Graefe.html; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "This paper describes the design and prototypical implementation of an architecture for hypertext systems which is based on the process and object-oriented models of computation. Hypertext services are provided to applications through object-based distributed processes which interact using interprocess communication facilities. By merging the process, object-oriented, and hypertext models, hypertext data and functionality can be separated from applications and distributed across a network. This architecture allows links to cross application boundaries and diverse applications to be integrated under a common hypertext model. The paper describes the architecture and application requirements for operating in this environment. PROXHY, a prototypical implementation of the architecture, is also discussed.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Computer-communication networks; Database management; Design; Distr. applications; Distr. systems; Distributed systems; Document preparation; Hypermedia system architecture; Hypertext navigation and maps; Hypertext/hypermedia; Information interfaces and presentation; Information storage and retrieval; Interactive system; Management; Multimedia information systems; Object-oriented programming; Operating systems; Organization and design; Programming techniques; Systems; Systems and software; Text processing", } @Article{Jarke:1992:DEE, author = "M. Jarke and J. Mylopoulos and J. W. Schmidt and Y. Vassiliou", title = "{DAIDA}: An Environment for Evolving Information Systems", journal = j-TOIS, volume = "10", number = "1", pages = "1--50", month = jan, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We present a framework for the development of information systems based on the premise that the knowledge that influences the development process needs to somehow be captured, represented, and managed if the development process is to be rationalized. Experiences with a prototype environment developed in ESPRIT project DAIDA demonstrate the approach. The project has implemented an environment based on state-of-the-art languages for requirements modeling, design and implementation of information systems. In addition, the environment offers tools for aiding the mapping process from requirements to design and then to implementation, also for representing decisions reached during the development process. The development process itself is represented explicitly within the system, thus making the DAIDA development framework easier to comprehend, use, and modify.", acknowledgement = ack-nhfb, affiliation = "RWTH Aachen", affiliationaddress = "Aachen, Ger", classification = "723.1; 723.1.1; 723.2; 723.3; 903.3; 921", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computational methods; Computer aided software engineering; Computer programming languages; Computer software; Computer software selection and evaluation; Conformal mapping; Data dictionary; Data structures; Database systems; Design languages; Information retrieval systems; Information science; Knowledge based systems; Management information systems; Mapping assistant; Multilevel specification; Quality assurance; Repository; Software information system; Software process model; Software quality assurance", wwwtitle = "{DAIDA}: a Knowledge-Based Environment for Developing Information Systems", } @Article{Gemmell:1992:PDS, author = "Jim Gemmell and Stavros Christodoulakis", title = "Principles of Delay Sensitive Multi-media Data Storage and Retrieval", journal = j-TOIS, volume = "10", number = "1", pages = "51--90", month = jan, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "This paper establishes some fundamental principles for the retrieval and storage of delay-sensitive multimedia data. Delay-sensitive data include digital audio, animations, and video. Retrieval of these data types from secondary storage has to satisfy certain time constraints in order to be acceptable to the user. The presentation is based on digital audio in order to provide intuition to the reader, although the results are applicable to all delay-sensitive data. A theoretical framework is developed for the real-time requirements of digital audio playback. We show how to describe these requirements in terms of the consumption rate of the audio data and the nature of the data-retrieval rate from secondary storage. Making use of this framework, bounds are derived for buffer space requirements for certain common retrieval scenarios. Storage placement strategies for multichannel synchronized data are then categorized and examined. The results presented in this paper are basic to any playback of delay-sensitive data and should assist the multimedia system designer in estimating hardware requirements and in evaluating possible design choices.", acknowledgement = ack-nhfb, affiliation = "Simon Fraser Univ", affiliationaddress = "Burnaby, BC, Can", classification = "716.1; 723.2; 723.3; 741.3; 752.2; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Continuous media; Data processing; Data recording; Data storage equipment; Database systems; Delay sensitive data; Digital audio playback; Digital signal processing; Image processing; Information retrieval systems; Multimedia information systems; Parameter estimation; Real time systems; Stereophonic recordings", } @Article{Want:1992:ABL, author = "Roy Want and Andy Hopper and Veronica Falcao and Jonathan Gibbons", title = "The Active Badge Location System", journal = j-TOIS, volume = "10", number = "1", pages = "91--102", month = jan, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "A novel system for the location of people in an office environment is described. Members of staff wear badges that transmit signals providing information about their location to a centralized location service, through a network of sensors. The paper also examines alternative location techniques, system design issues and applications, particularly relating to telephone call routing. Location systems raise concerns about the privacy of an individual, and these issues are also addressed.", acknowledgement = ack-nhfb, affiliation = "Olivetti Research Ltd", affiliationaddress = "Cambridge, Engl", classification = "716.1; 718.1; 722.3; 723.2; 723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Active badges; Computer networks; Data communication equipment; Data communication systems; Database systems; Digital communication systems; Information retrieval systems; Location; Location systems; Multiplexing equipment; Office automation; Privacy issues; Security of data; Sensors; Tagging systems", } @Article{Grudin:1992:CSF, author = "Jonathan Grudin", title = "Consistency, Standards, and Formal Approaches to Interface Development and Evaluation: a Note on {Wiecha}, {Bennett}, {Boies}, {Gould}, And {Greene}", journal = j-TOIS, volume = "10", number = "1", pages = "103--111", month = jan, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wiecha:1992:UIC, author = "Charles Wiecha", title = "{ITS} and User Interface Consistency: a Response to {Grudin}", journal = j-TOIS, volume = "10", number = "1", pages = "112--114", month = jan, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Krovetz:1992:LAI, author = "Robert Krovetz and W. Bruce Croft", title = "Lexical Ambiguity and Information Retrieval", journal = j-TOIS, volume = "10", number = "2", pages = "115--141", month = apr, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Lexical ambiguity is a pervasive problem in natural language processing. However, little quantitative information is available about the extent of the problem or about the impact that it has on information retrieval systems. We report on an analysis of lexical ambiguity in information retrieval test collections and on experiments to determine the utility of word meanings for separating relevant from nonrelevant documents. The experiments show that there is considerable ambiguity even in a specialized database. Word senses provide a significant separation between relevant and nonrelevant documents, but several factors contribute to determining whether disambiguation will make an improvement in performance. For example, resolving lexical ambiguity was found to have little impact on retrieval effectiveness for documents that have many words in common with the query. Other uses of word sense disambiguation in an information retrieval context are discussed.", acknowledgement = ack-nhfb, affiliation = "Univ of Massachusetts", affiliationaddress = "Amherst, MA, USA", classification = "721.1; 723.2; 723.4; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Computational linguistics; Data processing; Disambiguation; Indexing (of information); Information retrieval systems; Lexical ambiguity; Linguistics; Natural language processing systems; Semantically based search; Terminology; Word senses", } @Article{Botafogo:1992:SAH, author = "Rodrigo A. Botafogo and Ehud Rivlin and Ben Shneiderman", title = "Structural Analysis of Hypertexts: Identifying Hierarchies and Useful Metrics", journal = j-TOIS, volume = "10", number = "2", pages = "142--180", month = apr, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Hypertext users often suffer from the `lost in hyperspace' problem: disorientation from too many jumps while traversing a complex network. One solution to this problem is improved authoring to create more comprehensible structures. This paper proposes several authoring tools, based on hypertext structure analysis. In many hypertext systems authors are encouraged to create hierarchical structures, but when writing, the hierarchy is lost because of the inclusion of cross-reference links. The first part of this paper looks at ways of recovering lost hierarchies and finding new ones, offering authors different views of the same hypertext. The second part helps authors by identifying properties of the hypertext document. Multiple metrics are developed including compactness and stratum. Compactness indicates the intrinsic connectedness of the hypertext, and stratum reveals to what degree the hypertext is organized so that some nodes must be read before others. Several existing hypertexts are used to illustrate the benefits of each technique. The collection of techniques provides a multifaceted view of the hypertext, which should allow authors to reduce undesired structural complexity and create documents that readers can traverse more easily.", acknowledgement = ack-nhfb, affiliation = "Univ of Maryland", affiliationaddress = "College Park, MD, USA", classification = "461.4; 723.2; 903.3; 921", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer networks; Data reduction; Data structures; Graph theory; Hierarchical systems; Human engineering; Hypertext systems; Information retrieval; Man machine systems; Metrics; User interfaces", } @Article{Carroll:1992:GAT, author = "John M. Carroll and Mary Beth Rosson", title = "Getting Around the Task-Artifact Cycle: How to Make Claims and Design by Scenario", journal = j-TOIS, volume = "10", number = "2", pages = "181--212", month = apr, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We are developing an `action science' approach to human-computer interaction (HCI), seeking to better integrate activities directed at understanding with those directed at design. The approach leverages development practices of current HCI with methods and concepts to support a shift toward using broad and explicit design rationale to reify where we are in a design process, why we are there, and to guide reasoning about where we might go from there. We represent a designed artifact as the set of user scenarios supported by that artifact and more finely by causal schemas detailing the underlying psychological rationale. These schemas, called claims, unpack wherefores and whys of the scenarios. In this paper, we stand back from several empirical projects to clarify our commitments and practices.", acknowledgement = ack-nhfb, affiliation = "IBM Thomas J. Watson Research Cent", affiliationaddress = "Yorktown Heights, NY, USA", classification = "461.4; 723.5; 921", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer aided software engineering; Design rationale; Human computer interaction (HCI); Human engineering; Man machine systems; Mathematical models; Software engineering; User interfaces", } @Article{Blake:1992:SOE, author = "G. Elizabeth Blake and Tim Bray and Frank Wm. Tompa", title = "Shortening the {OED}: {Experience} with a Grammar-Defined Database", journal = j-TOIS, volume = "10", number = "3", pages = "213--232", month = jul, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Textual databases with highly variable structure can be usefully described by a grammar-defined model. One example of such a text is the Oxford English Dictionary. This paper describes a first attempt to apply technology based on this model to a real problem. A language called GOEDEL, which is a partial implementation of a set of grammar-defined database operators, was used to extract and alter a subset of the OED in order to assist the editors in their production of The Shorter Oxford English Dictionary. The implementation of the pstring data structure to describe a piece of text and the functions that operate on this pstring are illustrated with some detailed examples. The project was judged a success and the resulting program used in production by the Oxford University Press.", acknowledgement = ack-nhfb, affiliation = "Univ of Waterloo", affiliationaddress = "Waterloo, Ont, Can", classification = "721.1; 723.2; 723.3; 903.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computational grammars; Computational linguistics; Data structures; Database systems; Formal languages; Goedel formal language; Grammar defined model; Oxford English Dictionary; Parsed string; Pstring data structure; Shorter Oxford English Dictionary; Terminology; Text databases", } @Article{Palaniappan:1992:EFO, author = "Murugappan Palaniappan and Nicole Yankelovich and George Fitzmaurice and Anne Loomis and Bernard Haan and James Coombs and Norman Meyrowitz", title = "The Envoy Framework: An Open Architecture for Agents", journal = j-TOIS, volume = "10", number = "3", pages = "233--264", month = jul, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The Envoy Framework addresses a need for computer-based assistants or agents that operate in conjunction with users' existing applications, helping them perform tedious, repetitive, or time-consuming tasks more easily and efficiently. Envoys carry out missions for users by invoking envoy-aware applications called operatives and inform users of mission results via envoy-aware applications called informers. The distributed, open architecture developed for Envoys is derived from an analysis of the best characteristics of existing agent systems. This architecture has been designed as a model for how agent technology can be seamlessly integrated into the electronic desktop. It defines a set of application programmer's interfaces so that developers may convert their software to envoy-aware applications. A subset of the architecture described in this paper has been implemented in an Envoy Framework prototype.", acknowledgement = ack-nhfb, affiliation = "Brown Univ", affiliationaddress = "Providence, RI, USA", classification = "722.4; 723.1; 903.2; 903.3; 912.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Application programmer interface (api); Computer architecture; Computer software; Computer systems programming; Distributed computer systems; Distributed open architecture; Envoy Framework; Information dissemination; Information management; Information retrieval; Software engineering; User agents; User envoys; User informers; User interfaces; User operatives; Work simplification", wwwauthor = "M. Palaniappan and G. Fitzmaurice and N. Yankelovich and George Fitzmaurice and Anne Loomis and Bernard Haan and James Coombs and Norman Meyrowitz", wwwtitle = "The {Envoy} System: An Open Architecture for Agents", } @Article{Ioannidis:1992:CLD, author = "Yannis E. Ioannidis and Tomas Saulys and Andrew J. Whitsitt", title = "Conceptual Learning in Database Design", journal = j-TOIS, volume = "10", number = "3", pages = "265--293", month = jul, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "This paper examines the idea of incorporating machine learning algorithms into a database system for monitoring its stream of incoming queries and generating hierarchies with the most important concepts expressed in those queries. The goal is for these hierarchies to provide valuable input to the database administrator for dynamically modifying the physical and external schemas of a database for improved system performance and user productivity. The criteria for choosing the appropriate learning algorithms are analyzed, and based on them, two such algorithms, UNIMEM and COBWEB, are selected as the most suitable ones for the task. Standard UNIMEM and COBWEB implementations have been modified to support queries as input. Based on the results of experiments with these modified implementations, the whole approach appears to be quite promising, especially if the concept hierarchy from which the learning algorithms start their processing is initialized with some of the most obvious concepts captured in the database.", acknowledgement = ack-nhfb, affiliation = "Univ of Wisconsin", affiliationaddress = "Madison, WI, USA", classification = "723.1; 723.3; 723.4; 921.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Adaptive database systems; Adaptive systems; Algorithms; cobweb algorithm; Database schemas; Database systems; Hierarchical systems; Learning algorithms; Learning from examples; Learning systems; Optimization; Performance; Query languages; UNIMEM algorithm", wwwauthor = "Y. E. Ioannidis and T. Saulys and A. J. Whittsitt", } @Article{Rada:1992:CTH, author = "Roy Rada", title = "Converting a Textbook to Hypertext", journal = j-TOIS, volume = "10", number = "3", pages = "294--315", month = jul, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Traditional documents may be transformed into hypertext by first reflecting the document's logical markup in the hypertext (producing first-order hypertext) and then by adding links not evident in the document markup (producing second-order hypertext). In our transformation of a textbook to hypertext, the textbook is placed in an intermediate form based on a semantic net and is then placed into the four hypertext systems: Emacs-Info, Guide, HyperTies, and SuperBook. The first-order Guide and SuperBook hypertexts reflect a depth-first traversal of the semantic net, and the Emacs-Info and HyperTies hypertexts reflect a breadth-first traversal. The semantic net is augmented manually, and then new traversal programs automatically generate alternate outlines. An index based on word patterns in the textbook is also automatically generated for the second-order hypertext. Our suite of programs has been applied to a published textbook, and the resulting hypertexts are publicly available.", acknowledgement = ack-nhfb, affiliation = "Univ of Liverpool", affiliationaddress = "Liverpool, Engl", classification = "461.4; 723.2; 723.5; 903.1; 903.2; 903.3; C6130D (Document processing techniques); C6160Z (Other DBMS); C7250 (Information storage and retrieval)", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer applications; Computer software; Data processing; Document markup; Hierarchical systems; Human computer interaction; Human engineering; Hypermedia models; Hypertext; Indexing (of information); Information dissemination; Information retrieval systems; Man machine systems; Semantic net; Software package Emacs Info; Software package Guides; Software package HyperTies; Software package Superbook; Textbooks", wwwtitle = "Converting a Text to {Guide}, {HyperTies}, and {Superbook}: Practice and Principles", } @Article{Mackinlay:1992:EUI, author = "Jock Mackinlay and Jim Rhyne", title = "Editorial: User Interface Software and Technology", journal = j-TOIS, volume = "10", number = "4", pages = "317--319", month = oct, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pausch:1992:LLS, author = "Randy Pausch and Matthew Conway and Robert DeLine", title = "Lessons Learned from {SUIT}, the {Simple User Interface Toolkit}", journal = j-TOIS, volume = "10", number = "4", pages = "320--344", month = oct, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "In recent years, the computer science community has realized the advantages of GUIs (Graphical User Interfaces). Because high-quality GUIs are difficult to build, support tools such as UIMSs, UI Toolkits, and Interface Builders have been developed. Although these tools are powerful, they typically make two assumptions: first, that the programmer has some familiarity with the GUI model, and second, that he is willing to invest several weeks becoming proficient with the tool. These tools typically operate only on specific platforms, such as DOS, the Macintosh, or UNIX/X-windows. The existing tools are beyond the reach of most undergraduate computer science majors, or professional programmers who wish to quickly build GUIs without investing the time to become specialists in GUI design. For this class of users, we developed SUIT, the Simple User Interface Toolkit. SUIT is an attempt to distill the fundamental components of an interface builder and GUI toolkit, and to explain those concepts with the tool itself, all in a short period of time. We have measured that college juniors with no previous GUI programming experience can use SUIT productively after less than three hours. SUIT is a C subroutine library which provides an external control UIMS, an interactive layout editor, and a set of standard `widgets,' such as sliders, buttons, and check boxes. SUIT-based applications run transparently across the Macintosh, DOS, and UNIX/X platforms. SUIT has been exported to hundreds of external sites on the Internet. This paper describes SUIT's architecture, the design decisions we made during its development, and the lessons we learned from extensive observations of over 120 users.", acknowledgement = ack-nhfb, affiliation = "Univ of Virginia", affiliationaddress = "Charlottesville, VA, USA", classification = "461.4; 722.4; 723.1; 723.1.1; 723.2; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "C (programming language); Computer graphics; Computer operating systems; Computer programming; Computer science; Computer software; Computer software portability; Graphical user interfaces; Human engineering; Interactive computer systems; Learnability; Learning systems; Pedagogy; Rapid prototyping; Simple user interface toolkit (suit); Software engineering; Software tools; User interface toolkit; User interfaces", wwwauthor = "R. Pausch and M. Conway and R. Deline", } @Article{Dewan:1992:HLF, author = "Prasun Dewan and Rajiv Choudhary", title = "A High-Level and Flexible Framework for Implementing Multiuser User Interfaces", journal = j-TOIS, volume = "10", number = "4", pages = "345--380", month = oct, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We have developed a high-level and flexible framework for supporting the construction of multiuser user interfaces. The framework is based on a generalized editing interaction model, which allows users to view programs as active data that can be concurrently edited by multiple users. It consists of several novel components including a refinement of both the Seeheim UIMS architecture and the distributed graphics architecture that explicitly addresses multiuser interaction; the abstractions of shared active variables and interaction variables, which allow users and applications to exchange information; a set of default collaboration rules designed to keep the collaboration-awareness low in multiuser programs; and a small but powerful set of primitives for overriding these rules. The framework allows users to be dynamically added and removed from a multiuser session, different users to use different user interfaces to interact with an application, the modules interacting with a particular user to execute on the local workstation, and programmers to incrementally trade automation for flexibility. We have implemented the framework as part of a system called Suite. This paper motivates, describes, and illustrates the framework using the concrete example of Suite, discusses how it can be implemented in other kinds of systems, compares it with related work, discusses its shortcomings, and suggests directions for future work.", acknowledgement = ack-nhfb, affiliation = "Purdue Univ", affiliationaddress = "West Lafayette, IN, USA", classification = "461.4; 722.4; 723.1.1; 723.2; 723.3; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Administrative data processing; Computer architecture; Computer graphics; Computer networks; Computer programming languages; Computer supported cooperative work; Distributed computer systems; Distributed database systems; File editors; Flexibility; Groupware; Human engineering; Interactive computer systems; Multiprocessing systems; Multiuser user interfaces; Text editing; User interface management systems; User interfaces", wwwtitle = "Coupling the User Interfaces of a Multi-User Program", } @Article{Bier:1992:ESB, author = "Eric A. Bier", title = "{EmbeddedButtons}: Supporting Buttons in Documents", journal = j-TOIS, volume = "10", number = "4", pages = "381--407", month = oct, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "EmbeddedButtons is a library of routines and a runtime kernel that support the integration of buttons into document media, including text and graphics. Existing document editors can be modified to participate in this open architecture with the addition of a few simple routines. Unlike many button systems that insert special button objects into document media, this system supports turning existing document objects into buttons. As a consequence, buttons inherit all of the attributes of normal document objects, and the appearance of buttons can be edited using operations already familiar to users. Facilities are provided for linking buttons to application windows so that documents can serve as application control panels. Hence, user interface designers can lay out control panels using familiar document editors rather than special-purpose tools. Three classes of buttons have been implemented, including buttons that pop up a menu and buttons that store and display the value of a variable. New button classes, editors, and applications can be added at run time. Two editors, one for text and one for graphics, currently participate in the architecture.", acknowledgement = ack-nhfb, affiliation = "Xerox Palo Alto Research Cent", affiliationaddress = "Palo Alto, CA, USA", classification = "461.4; 722; 722.4; 723.1; 723.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Active documents; Computer architecture; Computer graphics; Computer software; EmbeddedButtons; File editors; Human engineering; Interaction techniques; Interactive computer systems; Man machine systems; Rapid prototyping; Software engineering; Subroutines; Text editing; User interfaces", } @Article{Matsuoka:1992:GFB, author = "Satoshi Matsuoka and Shin Takahashi and Tomihisa Kamada and Akinori Yonezawa", title = "A General Framework for Bidirectional Translation between Abstract and Pictorial Data", journal = j-TOIS, volume = "10", number = "4", pages = "408--437", month = oct, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The merits of direct manipulation are now widely recognized. However, direct manipulation interfaces incur high cost in their creation. To cope with this problem, we present a model of bidirectional translation between pictures and abstract application data, and a prototype system, TRIP2, based on this model. Using this model, general mapping from abstract data to pictures and from pictures to abstract data is realized merely by giving declarative mapping rules, allowing fast and easy creation of direct manipulation interfaces. We apply the prototype system to the generation of the interfaces for kinship diagrams, Graph Editors, E-R diagrams, and an Othello game.", acknowledgement = ack-nhfb, affiliation = "Univ of Tokyo", affiliationaddress = "Tokyo, Jpn", classification = "721.1; 723.1; 723.2; 723.5; 741.3; 921", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Abstract application data; Algorithms; Bidirectional translation; Computational methods; Computer graphics; Data processing; Direct manipulation; File editors; Human engineering; Human information processing; Humanities computing; Image processing; Interactive computer systems; Mathematical models; Prototype system trip2; Software engineering; User interface management systems; User interfaces; Visualization", wwwauthor = "S. Takahashi and S. Matsuoka and A. Yonezawa and T. Kamada", wwwtitle = "A General Framework for Bi-directional Translation between Abstract and Pictorial Data", } @Article{Kataoka:1992:MIO, author = "Yutaka Kataoka and Masato Morisaki and Hiroshi Kuribayashi and Hiroyoshi Ohara", title = "A Model for Input and Output of Multilingual Text in a Windowing Environment", journal = j-TOIS, volume = "10", number = "4", pages = "438--451", month = oct, year = "1992", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The layered multilingual input\slash output (I/O) system we designed, based on typological studies of major-language writing conventions, unifies common features of such conventions to enable international and local utilization. The internationalization layer input module converts keystroke sequences to phonograms and ideograms. The corresponding output module displays position-independent and dependent characters. The localization layer positions language-specific functions outside the structure, integrating them as tables used by finite automaton interpreters and servers to add new languages and code sets without recompilation. The I/O system generates and displays stateful and stateless code sets, enabling interactive language switching. Going beyond POSIX locale model bounds, the system generates ISO 2022, ISO\slash DIS 10646 (1990), and Compound Text, defined for the interchange encoding format in X11 protocols, for basic polyglot text communication and processing. Able to generate multilingual code sets, the I/O system clearly demonstrates that code sets should be selected by applications which have purposes beyond selecting one element from a localization set. Functionality and functions related to text manipulation in an operating system (OS) must also be determined by such applications. A subset of this I/O system was implemented in the X window system as a basic use of X11R5 I/O by supplying basic code set generation and string manipulation to eliminate OS interference. To ensure polyglot string manipulation, the I/O system must clearly be implemented separately from an OS and its limitations.", acknowledgement = ack-nhfb, affiliation = "Waseda Univ", affiliationaddress = "Tokyo, Jpn", classification = "722.4; 723.1; 723.1.1; 723.2; 902.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Codes (symbols); Computer operating systems; Computer programming languages; Data processing; Data structures; Encoding (symbols); Input output programs; Interactive computer systems; Internationalization; iso 2022 standard; iso/dis 10646 (1990) standard; Linguistics; Localization; Multilingual; Multiwindow; Network protocols; Polyglot text; POSIX locale code; Program interpreters; Standardization; X window systems; X11 protocols", } @Article{Garzotto:1993:HMB, author = "Franca Garzotto and Paolo Paolini and Daniel Schwabe", title = "{HDM} --- {A} Model Based Approach to Hypertext Application Design", journal = j-TOIS, volume = "11", number = "1", pages = "1--26", month = jan, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Hypertext development should benefit from a systematic, structured development, especially in the case of large and complex applications. A structured approach to hypertext development suggests the notion of authoring-in-the-large. Authoring-in-the-large allows the description of overall classes of information elements and navigational structures of complex applications without much concern with implementation details, and in a system-independent manner. The paper presents HDM (Hypertext Design Model), a first step towards defining a general purpose model for authoring-in-the-large. Some of the most innovative features of HDM are: the notion of perspective; the identification of different categories of links (structural links, application links, and perspective links) with different representational roles; the distinction between hyperbase and access structures; and the possibility of easily integrating the structure of a hypertext application with its browsing semantics. HDM can be used in different manners: as a modeling device or as an implementation device. As a modeling device, it supports producing high level specifications of existing or to-be-developed applications. As an implementation device, it is the basis for designing tools that directly support application development. One of the central advantages of HDM in the design and practical construction of hypertext applications is that the definition of a significant number of links can be derived automatically from a conceptual-design level description. Examples of usage of HDM are also included.", acknowledgement = ack-nhfb, affiliation = "Politecnico di Milano", classification = "723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data models; Database systems; Hypertext; Information retrieval systems; Office automation", } @Article{Schnase:1993:SDM, author = "John L. Schnase and John J. Leggett and David L. Hicks and Ron L. Szabo", title = "Semantic Data Modeling of Hypermedia Associations", journal = j-TOIS, volume = "11", number = "1", pages = "27--50", month = jan, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Many important issues in the design and implementation of hypermedia system functionality focus on the way interobject connections are represented, manipulated, and stored. A prototypic system called HB1 is being designed to meet the storage needs of next-generation hypermedia system architectures. HB1 is referred to as a hyperbase management systems (HBMS) because it supports, not only the storage and manipulation of information, but the storage and manipulation of the connectivity data that link information together to form hypermedia. Among HB1's distinctions is its use of a semantic network database system to manage physical storage. Here, basic semantic modeling concepts as they apply to hypermedia systems are reviewed, and experiences using a semantic database system in HB1 are discussed. Semantic data models attempt to provide more powerful mechanisms for structuring objects than are provided by traditional approaches. In HB1, it was necessary to abstract interobject connectivity, behaviors, and information for hypermedia. Building on top pf a semantic database system facilitated such a separation and made the structural aspects of hypermedia conveniently accessible to manipulation. This becomes particularly important in the implementation of structure-related operations such as structural queries. Our experience suggests that an intergrated semantic object-oriented database paradigm appears to be superior to purely relational, semantic, or object-oriented methodologies for representing the structurally complex interrelationships that arise in hypermedia.", acknowledgement = ack-nhfb, affiliation = "CRSS Architects, Inc", classification = "723.1; 723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data models; Database systems; Information retrieval systems; Management information systems; Object oriented programming", } @Article{Rama:1993:ICR, author = "D. V. Rama and Padmini Srinivasan", title = "An Investigation of Content Representation Using Text Grammars", journal = j-TOIS, volume = "11", number = "1", pages = "51--75", month = jan, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We extend prior work on a model for natural language text representation and retrieval using a linguistic device called text grammar. We demonstrate the value of this approach in accessing relevant items from a collection of empirical abstracts in a medical domain. The advantage, when compared to traditional keyword retrieval, is that this approach is a significant move towards knowledge representation and retrieval. Text representation in this model includes keywords and their conceptual roles in the text. In particular, it involves extracting TOPIC predicates representing the research issue addressed and DESIGN predicates representing important methodological features of the empirical study. Preliminary experimentation shows that keywords exhibit a variety of text-grammar roles in a test database. Second, as intuitively expected, retrieval using TOPIC predicates identifies a smaller subset of texts than Boolean retrieval does. These empirical results along with the theoretical work indicate that the representation and retrieval strategies proposed have a significant potential. Finally, EMPIRICIST,a prototype system, is described. In it the text representation predicates are implemented as a network while retrieval is through constrained-spreading activation strategies.", acknowledgement = ack-nhfb, affiliation = "Bentley Coll", classification = "723.5; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Indexing (of information); Information retrieval systems; Natural language processing systems; Text analysis", } @Article{Szczur:1993:TPT, author = "Martha R. Szczur and Sylvia B. Sheppard", title = "{TAE} Plus: Transportable Applications Environment Plus: a User Interface Development Environment", journal = j-TOIS, volume = "11", number = "1", pages = "76--101", month = jan, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The Transportable Applications Environment Plus (TAE Plus${}^{TM}$) is a NASA-developed user interface development environment (UIDE) for the rapid prototyping, evaluation, implementation, and management of user interfaces. TAE Plus provides an intuitive What You see Is What You Get (WYSIWYG) WorkBench for designing an application's user interface. The WorkBench supports the creation and sequencing of displays, including real-time, data-driven display objects. Users can define context-sensitive help for a target application. They can rehearse the user interface and also generate code automatically. In addition, TAE Plus contains application services for the runtime manipulation and management of the user interface. Based on Motif${}^{TM}$ and the MIT X Window System${}^{TM}$, TAE Plus runs on a variety of Unix-or VMS-based workstations. TAE Plus is an evolving system. User-defined requirements and new technology guide the development of each new version. Advances in virtual operating systems, human factors, computer graphics, command language design, standardization, and software portability are monitored and incorporated as they become available.", acknowledgement = ack-nhfb, affiliation = "NASA", classification = "461.4; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Human engineering; Interfaces (computer); Prototyping; Software development; Software engineering; User interfaces", wwwauthor = "M. R. Szezur and S. B. Sheppard", wwwtitle = "{TAE Plus: Transportable Applications Environment Plus}", } @Article{King:1993:DDI, author = "Roger King and Michael Novak", title = "Designing Database Interfaces with {DBface}", journal = j-TOIS, volume = "11", number = "2", pages = "105--132", month = apr, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "DBface is a toolkit for designing interfaces to object-oriented databases. It provides users with a set of tools for building custom interfaces with minimal programming. This is accomplished by combining techniques from User Interface Management Systems (UIMS) with a built-in knowledge about the specific kinds of techniques used by object-oriented databases. DBface allows users to create graphical constructs and interactive techniques by taking advantage of an object-oriented database environment and tools. Not only can database tools be used for creating an interface, but information about the interface being built is stored within a database schema and is syntactically consistent with all other schema information. Thus, an interface can deal with data and schema information, including information about another interface. This allows for easy reusability of graphical constructs such as data representations.", acknowledgement = ack-nhfb, affiliation = "Univ of Colorado", classification = "722; 723.1; 723.3; 723.4.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer programming; Database interfaces; Database systems; Graphical interfaces; Interactive computer graphics; Interfaces (computer); Knowledge based systems; Object-oriented databases; User interfaces", } @Article{Ciaccia:1993:EAP, author = "Paulo Ciaccia and Pavel Zezula", title = "Estimating Accesses in Partitioned Signature File Organizations", journal = j-TOIS, volume = "11", number = "2", pages = "133--142", month = apr, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We show that performance of some basic methods for the partitioning of signature files, namely Quick Filter and Fixed Prefix, can be easily evaluated by means of a closed formula. The approximation is based on well-known results from probability theory, and, as shown by simulations, introduces no appreciable errors when compared with the exact, cumbersome formulas used so far. Furthermore, we prove that the exact formulas for the two methods coincide. Although this does not imply that the two methods behave in the same way, it sheds light on the way they could be compared.", acknowledgement = ack-nhfb, affiliation = "Univ of Bologna", affiliationaddress = "Italy", classification = "721.1; 723.5; 903.3; 922.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Access estimation; Codes (symbols); Computer simulation; File organization; Information retrieval; Partitioned signature files; Probability; Probability theory; Signature files", wwwauthor = "P. Zezula and P. Ciaccia", } @Article{Can:1993:ICD, author = "Fazli Can", title = "Incremental Clustering for Dynamic Information Processing", journal = j-TOIS, volume = "11", number = "2", pages = "143--164", month = apr, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Clustering of very large document databases is useful for both searching and browsing. The periodic updating of clusters is required due to the dynamic nature of databases. An algorithm for incremental clustering is introduced. The complexity and cost analysis of the algorithm together with an investigation of its expected behavior are presented. Through empirical testing it is shown that the algorithm achieves cost effectiveness and generates statistically valid clusters that are compatible with those of reclustering. The experimental evidence shows that the algorithm creates an effective and efficient retrieval environment.", acknowledgement = ack-nhfb, affiliation = "Miami Univ", classification = "723.2; 723.3; 903.3; 911.1; 922.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Browsing; Clustering; Cost accounting; Cost effectiveness; Data processing; Database systems; Document databases; Dynamic information processing; Incremental clustering; Information retrieval; Statistical methods; Statistically valid clusters", } @Article{Bansler:1993:RSA, author = "J{\o}rgen P. Bansler and Keld B{\o}dker", title = "A Reappraisal of Structured Analysis: Design in an Organizational Context", journal = j-TOIS, volume = "11", number = "2", pages = "165--193", month = apr, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We review Structured Analysis as presented by Yourdon and DeMarco. First, we examine the implicit assumptions embodied in the method about the nature of organizations, work processes, and design. Following this we present the results of an exploratory study, conducted to find out how the method is applied in practice. This study reveals that while some of the tools of Structured Analysis --- notably the data flow diagram --- are used and combined with other tools, the designers do not follow the analysis and design procedures prescribed by the method. Our findings suggest that there is a gap between the way systems development is portrayed in the normative technical literature and the way in which is carried out.", acknowledgement = ack-nhfb, affiliation = "Univ of Copenhagen", classification = "721.1; 723.1; 723.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer programming; Computer software; Data flow diagrams; Data processing; Structured analysis; Structured programming; Work processes", wwwtitle = "A Reappraisal of Structured Analysis", } @Article{Feiner:1993:EVW, author = "Steven K. Feiner and Simon J. Gibbs", title = "Editorial: Virtual Worlds", journal = j-TOIS, volume = "11", number = "3", pages = "195--196", month = jul, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Virtual Worlds.", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fitzmaurice:1993:VRP, author = "George W. Fitzmaurice and Shumin Zhai and Mark H. Chignell", title = "Virtual Reality for Palmtop Computers", journal = j-TOIS, volume = "11", number = "3", pages = "197--218", month = jul, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Virtual Worlds.", URL = "http://www.acm.org:80", abstract = "We are exploring how virtual reality theories can be applied toward palmtop computers, In our prototype, called the Cameleon, a small 4-inch hand-held monitor acts as a palmtop computer with the capabilities of a Silicon graphics workstation. A 6D input device and a response button are attached to the small monitor to detect user gestures and input selections for issuing commands. An experiment was conducted to evaluate our design and to see how well depth could be perceived in the small screen compared to a large 21-inch screen, and the extent to which movement of the small display ( in a palmtop virtual reality condition) could improve depth perception.", acknowledgement = ack-nhfb, affiliation = "Univ of Toronto", affiliationaddress = "Can", classification = "723", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer workstations; Computers; Depth perception improvement; Palmtop virtual reality condition; Silicon graphics workstation; Virtual reality theories; Virtual storage", } @Article{Sturman:1993:DMW, author = "David J. Sturman and David Zeltzer", title = "A Design Method for ``Whole Hand'' Human-Computer Interaction", journal = j-TOIS, volume = "11", number = "3", pages = "219--238", month = jul, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Virtual Worlds.", URL = "http://www.acm.org:80", abstract = "A disciplined investigation of whole-hand interfaces (often glove based, currently) and their appropriate use for the control of complex task domains by the design method for whole-hand input. This is a series of procedures --- including a common basis for the description, design, and evaluation of whole-hand input, together with an accompanying taxonomy --- that enumerates key issues and points for consideration in the development of whole-hand input. The method helps designers focus on task requirements, isolate problem areas, and choose appropriate whole-hand input strategies for their specified tasks.", acknowledgement = ack-nhfb, affiliation = "Massachusetts Inst of Technology", affiliationaddress = "Cambridge, MA, USA", classification = "723; 723.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer graphics; Computers; Input devices; Interaction techniques; Man machine systems; Virtual environments; Whole hand human computer interaction", } @Article{Arthur:1993:ETP, author = "Kevin W. Arthur and Kellogg S. Booth and Colin Ware", title = "Evaluating {3D} Task Performance for Fish Tank Virtual Worlds", journal = j-TOIS, volume = "11", number = "3", pages = "239--265", month = jul, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Virtual Worlds.", URL = "http://www.acm.org:80", abstract = "'Fish tank virtual reality' refers to the use of a standard graphics workstation to achieve real-time display of 3D scenes using stereopsis and dynamic head-coupled perspective. Fish tank VR has a number of advantages over head-mounted immersion VR which makes it more practical for many applications. After discussing the characteristics of fish tank VR, we describe a set of three experiments conducted to study the benefits of fish tank VR over a traditional workstation graphics display. These experiments tested user performance under two conditions: (a) whether or not stereoscopic display was used and (b) whether or not the perspective display was coupled dynamically to the positions of a user's eyes. Subjects using a comparison protocol consistently preferred head coupling without stereo over stereo without head coupling.", acknowledgement = ack-nhfb, affiliation = "Univ of British Columbia", affiliationaddress = "Can", classification = "723; 723.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer graphics; Computer workstations; Computers; Fish tank virtual worlds; Head-coupled display; Standard graphics workstation; Three-dimensional graphics; Virtual storage; Virtual worlds", wwwauthor = "K. Arthur and K. Booth and C. Ware", } @Article{Koike:1993:RAS, author = "Hideki Koike", title = "The Role of Another Spatial Dimension in Software Visualization", journal = j-TOIS, volume = "11", number = "3", pages = "266--286", month = jul, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Virtual Worlds.", URL = "http://www.acm.org:80", abstract = "The primary objective of this article is to demonstrate the use of 3D-computer graphics in visualizing shapeless software information by focusing on performance monitoring of parallel-concurrent computer systems. Issues are addressed from two different perspectives: expressiveness of output media and user cognition. The former describes the limitations of 2D output media. The latter refers to a user's cognitive load when using 2D representations in a multiple-window environment.", acknowledgement = ack-nhfb, affiliation = "Univ of Electro-Communications", affiliationaddress = "Jpn", classification = "723; 723.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer graphics; Computer software; Electric power control system; Multiple-window environment; Parallel manipulator; Parallel-concurrent computer system; Prototype visualization system vogue; Shapeless software visualization; User's cognitive load", wwwtitle = "The Roles of Another Spatial Dimension in Software Visualization", } @Article{Shaw:1993:DSV, author = "Chris Shaw and Mark Green and Jiandong Liang and Yunqi Sun", title = "Decoupled Simulation in Virtual Reality with the {MR} Toolkit", journal = j-TOIS, volume = "11", number = "3", pages = "287--317", month = jul, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Virtual Worlds.", URL = "http://www.acm.org:80", abstract = "The Virtual Reality (VR) user interface style allows natural hand and body motions to manipulate virtual objects in 3D environments using one or more 3D input devices. This style is best suited to application areas", acknowledgement = ack-nhfb, affiliation = "Univ of Alberta", affiliationaddress = "Can", classification = "723; 723.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer software; Decoupled simulation model (dsm); Interactive computer graphics; Interactive three dimensional graphics; User interface software; Virtual object manipulations; Virtual reality (VR) user interface style; Virtual storage", } @Article{Malone:1993:GE, author = "Thomas Malone and Norbert Streitz", title = "Guest Editorial", journal = j-TOIS, volume = "11", number = "4", pages = "319--320", month = oct, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Supported Cooperative Work (CSCW).", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Olson:1993:GCC, author = "Judith S. Olson and Gary M. Olson and Marianne Storrosten and Mark Carter", title = "Groupwork Close Up: a Comparison of the Group Design Process With and Without a Simple Group Editor", journal = j-TOIS, volume = "11", number = "4", pages = "321--348", month = oct, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Supported Cooperative Work (CSCW).", URL = "http://www.acm.org:80", abstract = "A simple collaborative tool, a shared text editor called ShrEdit, changed the way groups of designers performed their work, and changed it for the better. First, the designs produced by the 19 groups of three designers were of higher quality than those of the 19 groups who worked with conventional whiteboard, paper and pencil. The groups with the new tool reported liming their work process a little less, probably because they had to adapt their work style to a new tool. We expected, from the brainstorming literature and recent work on Group Support Systems, that the reason the designs were of better quality was that the supported groups generated more ideas. To our surprise, the groups working with ShrEdit generated fewer design ideas, but apparently better ones. It appears that the tool helped the supported groups keep more focused on the core issues in the emerging design, to waste less time on less important topics, and to capture what was said as they went. This suggests that small workgroups can capitalize on the free access they have to a shared workspace, without requiring a facilitator or a work process embedded in the software.", acknowledgement = ack-nhfb, affiliation = "Univ of Michigan", affiliationaddress = "Ann Arbor, MI, USA", classification = "723; 903", conferenceyear = "1993", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer software; Concurrent editing; Decision support systems; Design; Group behavior; Group support system; Groupwork; Information science; Management information systems", } @Article{Ishii:1993:IIS, author = "Hiroshi Ishii and Minoru Kobayashi and Jonathan Grudin", title = "Integration of Interpersonal Space and Shared Workspace; {ClearBoard} Design and {Experiments}", journal = j-TOIS, volume = "11", number = "4", pages = "349--375", month = oct, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Supported Cooperative Work (CSCW).", URL = "http://www.acm.org:80", abstract = "We describe the evolution of the novel shared drawing medium clearBoard which was designed to seamlessly integrate an intrapersonal space and a shared workspace. ClearBoard permits coworkers in two locations to draw with color markers or with electronic pens and software tools while maintaining direct eye contact and the ability to employ natural gestures. The ClearBoard design is based on the key metaphor of `talking through and drawing on a transparent glass window'. We describe the evolution from ClearBoard-1 (which enables shared video drawing) to ClearBoard-2 (which incorporates TeamPaint, a multiuser paint editor). Initial observations and findings gained through the experimental use of the prototype, including the feature of `gaze awareness', are discussed. Further experiments are conducted with ClearBoard-0 (a simple mockup), ClearBoard-1, and an actual desktop as a control. IN the settings we examined, the ClearBoard environment led to more eye contact and potential awareness of collaborator's gaze direction over the traditional desktop environment.", acknowledgement = ack-nhfb, affiliation = "NTT Human Interface Laboratories", classification = "723; 903", conferenceyear = "1993", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer software; Decision support systems; Gaze awareness; Groupware; Information science; Interfaces (computer); Interpersonal space; management information systems; Shared workspace; Teleconferencing", } @Article{Hindus:1993:CSR, author = "Debby Hindus and Chris Schmandt and Chris Horner", title = "Capturing, Structuring, and Representing Ubiquitous Audio", journal = j-TOIS, volume = "11", number = "4", pages = "376--400", month = oct, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Supported Cooperative Work (CSCW).", URL = "http://www.acm.org:80", abstract = "Although talking is an integral part of collaboration, there has been little computer support for acquiring and accessing the contents of conversations. Our approach has focused on ubiquitous audio, or the unobtrusive capture of speech interactions in everyday work environments. Speech recognition technology cannot yet transcribe fluent conversational speech, so the words themselves are not available for organizing the captured interactions. Instead, the structure of an interaction is derived from acoustical information inherent in the stored speech and augmented by user interaction during or after capture. This article describes applications for capturing and structuring audio from office discussions and telephone calls, and mechanisms for later retrieval of these stored interactions. An important aspect of retrieval is choosing an appropriate visual representation, and this article describes the evolution of a family of representations across a range of applications. Finally, this work is placed within the broader context of desktop audio, mobile audio applications, and social implications.", acknowledgement = ack-nhfb, affiliation = "Interval Research Corporation", affiliationaddress = "Palo Alto, CA, USA", classification = "723; 752; 903", conferenceyear = "1993", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Audio systems; Collaborative work; Computer software; Decision support systems; Information retrieval systems; Interfaces (computer); Multimedia workstation; Software telephony; Teleconferencing; Ubiquitous audio", } @Article{Resnick:1993:PBC, author = "Paul Resnick", title = "Phone-Based {CSCW}: Tools and Trials", journal = j-TOIS, volume = "11", number = "4", pages = "401--424", month = oct, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Computer-Supported Cooperative Work (CSCW).", URL = "http://www.acm.org:80", abstract = "Telephones are the most ubiquitous, best-networked, and simplest computer terminals available today. They have been used for voice mail but largely overlooked as a platform for asynchronous cooperative-work applications such as event calendars, issue discussions, and question-and-answer gathering. HyperVoice is a software toolkit for constructing such applications. Its building blocks are high-level presentation formats for collections of structured voice messages. The presentation formats can themselves be presented and manipulated, enabling significant customization of applications by phone. Results of two field trials suggest social-context factors that will influence the success or failure of phone-based cooperative work applications in particular settings.", acknowledgement = ack-nhfb, classification = "716; 723; 903", conferenceyear = "1993", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Asynchronous cooperative work; Computer networks; Computer programming; Computer software; Phone based interface; Software toolkit; Telephone systems; User interfaces; Voice/data communication systems", } @Article{Anonymous:1993:AI, author = "Anonymous", title = "1993 Author Index", journal = j-TOIS, volume = "11", number = "4", pages = "425--426", month = oct, year = "1993", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Allen:1994:E, author = "Robert B. Allen", title = "Editorial", journal = j-TOIS, volume = "12", number = "1", pages = "1--1", month = jan, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Anonymous:1994:TC, author = "Anonymous", title = "{TOIS} Charter", journal = j-TOIS, volume = "12", number = "1", pages = "3--3", month = jan, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Marchionini:1994:EHL, author = "Gary Marchionini and Gregory Crane", title = "Evaluating Hypermedia and Learning: Methods and Results from the {Perseus Project}", journal = j-TOIS, volume = "12", number = "1", pages = "5--34", month = jan, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The Perseus Project has developed a hypermedia corpus of materials related to the ancient Greek world. The materials include a variety of texts and images, and tools for using these materials and navigating the system. Results from a three-year evaluation of Perseus use in a variety of college settings are described. The evaluation assessed both this particular system and the application of the technological genre to information management and to learning.", acknowledgement = ack-nhfb, affiliation = "Univ of Maryland", affiliationaddress = "College Park, MD, USA", classification = "403.2; 461.4; 723.5; 912.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer milieux; Human computer interaction; Human engineering; Human information processing; Hypermedia; Information science; Learning systems; Logic design; Machine systems; Navigation systems", } @Article{Poulovassilis:1994:NGM, author = "Alexandra Poulovassilis and Mark Levene", title = "A Nested-Graph Model for the Representation and Manipulation of Complex Objects", journal = j-TOIS, volume = "12", number = "1", pages = "35--68", month = jan, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Three recent trends in database research are object-oriented and deductive databases and graph-based user interfaces. We draw these trends together in a data model we call the Hypernode Model. The single data structure of this model is the hypernode, a graph whose nodes can themselves be graphs. Hypernodes are typed, and types, too, are nested graphs. We give the theoretical foundations of hypernodes and types, and we show that type checking is tractable. We show also how conventional type-forming operators can be simulated by our graph types, including cyclic types. The Hypernode Model comes equipped with a rule-based query language called Hyperlog, which is complete with respect to computation and update. We define the operational semantics of Hyperlog and show that the evaluation of Hyperlog programs is intractable in the general case--we identify cases when evaluation can be performed efficiently.", acknowledgement = ack-nhfb, affiliation = "King's College", affiliationaddress = "London, Engl", classification = "721.2; 723.2; 723.4; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer graphics; Computer networks; Computer programming; Data processing; Database browsing; Database management; Expert systems; Hyperlog programs; Hypernode project; Logic design; Nested graph", } @Article{Schauble:1994:EPQ, author = "Peter Schauble and Beat Wuthrich", title = "On the Expressive Power of Query Languages", journal = j-TOIS, volume = "12", number = "1", pages = "69--91", month = jan, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Two main topics are addressed. First, an algebraic approach is presented to define a general notion of expressive power. Heterogeneous algebras represent information systems and morphisms represent the correspondences between the instances of databases, the correspondences between answers, and the correspondences between queries. An important feature of this new notion of expressive power is that query languages of different types can be compared with respect to their expressive power.", acknowledgement = ack-nhfb, affiliation = "Swiss Federal of Technology", affiliationaddress = "Zurich, Switz", classification = "721.1; 721.2; 723.4; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Abstract data; Artificial intelligence; Computation theory; Computer programming; Datalog; Heterogeneous algebra; Information science; Logic design; Query correspondence; Query languages; Recursion", } @Article{Fuhr:1994:PIR, author = "Norbert Fuhr and Ulrich Pfeifer", title = "Probabilistic Information Retrieval as a Combination of Abstraction, Inductive Learning, and Probabilistic Assumptions", journal = j-TOIS, volume = "12", number = "1", pages = "92--115", month = jan, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "We show that former approaches in probabilistic information retrieval are based on one or two of the three concepts abstraction, inductive learning, and probabilistic assumptions, and we propose a new approach which combines all three concepts. This approach is illustrated for the case of indexing with a controlled vocabulary. For this purpose, we describe a new probabilistic model first, which is then combined with logistic regression, thus yielding a generalization of the original model.", acknowledgement = ack-nhfb, affiliation = "Univ of Dortmund", affiliationaddress = "Dortmund, Ger", classification = "721.2; 723.2; 723.4; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Abstraction; Artificial intelligence; Data feedback; Data storage equipment; Information science; Interactive devices; Learning systems; Logic design; Logistic regression; Probabilistic information; Probabilistic retrieval", wwwtitle = "Probabilistic Information Retrieval as Combination of Abstraction, Inductive Learning and Probabilistic Assumptions", } @Article{Kling:1994:ISI, author = "R. Kling", title = "Introduction to the Special Issue on Social Science Perspectives on {IS}", journal = j-TOIS, volume = "12", number = "2", pages = "117--118", month = apr, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Markus:1994:FHM, author = "M. L. Markus", title = "Finding a Happy Medium: Explaining the Negative Effects of Electronic Communication on Social Life at Work", journal = j-TOIS, volume = "12", number = "2", pages = "119--149", month = apr, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The sometimes observed negative social effects of electronic communication technology are often attributed to the characteristics of the technology itself. Electronic mail, for instance, filters out personal and social cues and provides new capabilities not found in traditional media,and it has been argued that these factors have consequences such as `flaming' and depersonalization. Alternative theoretical perspectives on the impacts of information technology suggest that our ability to explain these outcomes might be enhanced by attending to user's intentional choices about how to use technology and to the unpredictable technology usage patterns that emerge when users interact with the technology and each other. These alternative perspectives are examined in the context of an exploratory case study of a complex organization in which electronic mail was heavily used.", acknowledgement = ack-nhfb, affiliation = "The Calemont Graduate School", affiliationaddress = "Claremont, CA, USA", classification = "718.1; 903.2; 903.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Depersonalization; Electronic communication; Electronic mail; Information services; Negative effects; Social life at work; Telecommunication systems", wwwtitle = "Finding a Happy Medium: Explaining the Effects of Electronic Mail on Social Life at Work", } @Article{Walsham:1994:ISS, author = "G. Walsham and T. Waema", title = "Information Systems Strategy and Implementation: a Case Study of a Building Society", journal = j-TOIS, volume = "12", number = "2", pages = "150--173", month = apr, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The formation and implementation of strategy with respect to computer-based information systems (IS) are important issues in many contemporary organizations, including those in the financial services sector. This paper describes and analyzes an in-depth case study of the strategy formation and implementation process in one such organization, a medium-sized UK building society, and relates the process to its organizational and broader contexts; the organization is examined over a period of several years and under the contrasting leadership of two different chief executives. The case study is used to develop some general implications on IS strategy and implementation, which can be taken as themes for debate in any new situation. The paper provides an example of a more detailed perspective on processes in IS strategy and implementation than typically available in the literature. In addition, a new framework for further research in this area is developed, which directs the researcher toward exploring the dynamic interplay of strategic content, multilevel contexts, and cultural and political perspectives on the process of change.", acknowledgement = ack-nhfb, affiliation = "Univ of Cambridge", affiliationaddress = "Cambridge, Engl", classification = "723.5; 903.2; 903.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer applications; Implementation; Information dissemination; Information services; Information systems strategy; Multilevel context", } @Article{Orlikowski:1994:TFM, author = "Wanda J. Orlikowski and Debra C. Gash", title = "Technological Frames: Making Sense of Information Technology in Organizations", journal = j-TOIS, volume = "12", number = "2", pages = "174--207", month = apr, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "In this article, we build on and extend research into the cognitions and values of users and designers by proposing a systematic approach for examining the underlying assumptions. expectations, and knowledge that people have about technology. Such interpretations of technology (which we call technological (frames)) are central to understanding technological development, use, and change in organizations. We suggest that where the technological frames of key groups in organizations---such as managers, technologists, and change of technology may result. We use the findings of an empirical study to illustrate how the nature, value, and use of a groupware technology were interpreted by various organizational stakeholders, resulting in outcomes that deviated from those expected. We argue that technological frames offer an interesting and useful analytic perspective for explaining and anticipating actions and meanings that are not easily obtained with other theoretical lenses.", acknowledgement = ack-nhfb, affiliation = "Massachusetts Institute of Technology", affiliationaddress = "Cambridge, MA, USA", classification = "716.1; 723.5; 903.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Human factors; Information science; Information services; Organizations; Technological frames; Technology", } @Article{Ruhleder:1994:RLR, author = "Karen Ruhleder", title = "Rich and Lean Representations of Information for Knowledge Work: The Role of Computing Packages in the Work of Classical Scholars", journal = j-TOIS, volume = "12", number = "2", pages = "208--230", month = apr, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Applying information systems to complex intellectual tasks requires the representation and codification of ambiguous and fragmentary forms of data. This application effects changes not only in representation of this data, but in the relationships between users and tools, techniques, or systems for data interpretation. It also affects the complex infrastructures that support this process. This article uses a package metaphor to examine the impact on one domain of knowledge work, classical scholarship, of the `computerization' of a key data source, the textual edition. The construction of one on-line textual databank, the Thesaurus Linguae Graecae (TLG), has altered the traditional relationships between text `owners' and `users', has changed the role of the text as a conduit for social and historical information, and has disrupted traditional patterns of transmitting domain expertise. A rich information resource has become lean in its electronic form.", acknowledgement = ack-nhfb, affiliation = "Worcester Polytechnic Institute", affiliationaddress = "Worcester, MA, USA", classification = "723.5; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Classical scholars; Computer applications; Computing packages; Information retrieval systems; Information science; Lean representation; Rich representation", } @Article{Lewis:1994:GE, author = "D. D. Lewis and P. J. Hayes", title = "Guest Editorial", journal = j-TOIS, volume = "12", number = "3", pages = "231--233", month = jul, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Text Categorization.", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Apte:1994:ALD, author = "Chidanand Apte and Fred Damerau and Sholom M. Weiss", title = "Automated Learning of Decision Rules for Text Categorization", journal = j-TOIS, volume = "12", number = "3", pages = "233--251", month = jul, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Text Categorization.", URL = "http://www.acm.org:80", abstract = "We describe the results of extensive experiments using optimized rule-based induction methods on large document collections. The goal of these methods is to discover automatically classification patterns that can be used for general document categorization or personalized filtering of free text. Previous reports indicate that human-engineered rule-based systems, requiring many man-years of developmental efforts, have been successfully built to `read' documents and assign topics to them. We show that machine-generated decision rules appear comparable to human performance, while using the identical rule-based representation. In comparison with other machine-learning techniques, results on a key benchmark from the Reuters collection show a large gain in performance, from a previously reported 67\% recall\slash precision breakeven point to 80.5\%. In the context of a very high-dimensional feature space, several methodological alternatives are examined, including universal versus local dictionaries, and binary versus frequency-related features.", acknowledgement = ack-nhfb, affiliation = "IBM T. J. Watson Research Cent", affiliationaddress = "Yorktown Heights, NY, USA", classification = "461.4; 722.1; 723.4; 901.1.1; 902.2; 903.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Classification (of information); Data acquisition; Data storage equipment; Decision support systems; Human engineering; Information retrieval systems; Knowledge based systems; Learning systems; Man machine systems; Performance; Reuters collection; Societies and institutions; Standards; Terminology; Text categorization", } @Article{Yang:1994:EBM, author = "Yiming Yang and Christopher G. Chute", title = "An Example-Based Mapping Method for Text Categorization and Retrieval", journal = j-TOIS, volume = "12", number = "3", pages = "252--277", month = jul, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Text Categorization.", URL = "http://www.acm.org:80", abstract = "A unified model for text categorization and text retrieval is introduced. We use a training set of manually categorized documents to learn word-category associations, and use these associations to predict the categories of arbitrary documents. Similarly, we use a training set of queries and their related documents to obtain empirical associations between query words and indexing terms of documents, and use these associations to predict the related documents of arbitrary queries. A Linear Least Squares Fit (LLSF) technique is employed to estimate the likelihood of these associations. Document collections from the MEDLINE database and Mayo patient records are used for studies on the effectiveness of our approach, and on how much the effectiveness depends on the choices of training data, indexing language, word-weighting scheme, and morphological canonicalization. Alternative methods are also tested on these data collections for comparison. It is evident that the LLSF approach uses the relevance information effectively within human decisions of categorization and retrieval, and achieves a semantic mapping of free texts to their representations in an indexing language. Such a semantic mapping leads to a significant improvement in categorization and retrieval, compared to alternative approaches.", acknowledgement = ack-nhfb, affiliation = "Mayo Clinic\slash Foundation", affiliationaddress = "Rochester, MN, USA", classification = "721.1; 723.2; 723.3; 903.1; 903.3; 921.6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Classification (of information); Computational linguistics; Data acquisition; Database systems; Human engineering; Indexing (of information); Information analysis; Information retrieval; Learning systems; Least squares approximations; Mapping; Mathematical models; Morphological canonicalization; Query languages; Text categorization; Text retrieval", } @Article{Liddy:1994:TCM, author = "Elizabeth D. Liddy and Woojin Paik and Edmund S. Yu", title = "Text Categorization for Multiple Users Based on Semantic Features from a Machine-Readable Dictionary", journal = j-TOIS, volume = "12", number = "3", pages = "278--295", month = jul, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Text Categorization.", URL = "http://www.acm.org:80", abstract = "The text categorization module described here provides a front-end filtering function for the larger DR-LINK text retrieval system [Liddy and Myaeng 1993]. The module evaluates a large incoming stream of documents to determine which documents are sufficiently similar to a profile at the broad subject level to warrant more refined representation and matching. To accomplish this task, each substantive word in a text is first categorized using a feature set based on the semantic Subject Field Codes (SFCs) assigned to individual word senses in a machine-readable dictionary. When tested on 50 user profiles and 550 megabytes of documents, results indicate that the feature set that is the basis of the text categorization module and the algorithm that establishes the boundary of categories of potentially relevant documents accomplish their tasks with a high level of performance. This means that the category of potentially relevant documents for most profiles would contain at least 80\% of all documents later determined to be relevant to the profile. The number of documents in this set would be uniquely determined by the system's category-boundary predictor, and this set is likely to contain less than 5\% of the incoming stream of documents.", acknowledgement = ack-nhfb, affiliation = "Syracuse Univ", affiliationaddress = "Syracuse, NY, USA", classification = "721.1; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Abstracting; Algorithms; Classification (of information); Codes (symbols); Computational linguistics; Encoding (symbols); Indexing (of information); Information retrieval systems; Machine readable dictionary; Performance; Semantic features; Semantic vectors; Subject field coding; Terminology; Text categorization; User interfaces", } @Article{Riloff:1994:IEB, author = "Ellen Riloff and Wendy Lehnert", title = "Information Extraction as a Basis for High-Precision Text Classification", journal = j-TOIS, volume = "12", number = "3", pages = "296--333", month = jul, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Text Categorization.", URL = "http://www.acm.org:80", abstract = "We describe an approach to text classification that represents a compromise between traditional word-based techniques and in-depth natural language processing. Our approach uses a natural language processing task called `information extraction' as a basis for high-precision text classification. We present three algorithms that use varying amounts of extracted information to classify texts. The relevancy signatures algorithm uses linguistic phrases; the augmented relevancy signatures algorithm uses phrases and local context; and the case-based text classification algorithm uses larger pieces of context. Relevant phrases and contexts are acquired automatically using a training corpus. We evaluate the algorithms on the basis of two test sets from the MUC-4 corpus. All three algorithms achieved high precision on both test sets, with the augmented relevancy signatures algorithm and the case-based algorithm reaching 100\% precision with over 60\% recall on one set. Additionally, we compare the algorithms on a larger collection of 1700 texts and describe an automated method for empirically deriving appropriate threshold values. The results suggest that information extraction techniques can support high-precision text classification and, in general, that using more extracted information improves performance. As a practical matter, we also explain how the text classification system can be easily ported across domains.", acknowledgement = ack-nhfb, affiliation = "Univ of Massachusetts", affiliationaddress = "Amherst, MA, USA", classification = "721.1; 723.2; 903.1; 903.3; 922.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Augmented relevancy signatures algorithms; Case based text classification; Classification (of information); Computational linguistics; Data acquisition; Indexing (of information); Information analysis; Information extraction; Information retrieval; Natural language processing systems; Online searching; Phrases; Statistical methods; Training corpus", wwwpages = "296--337", wwwtitle = "Information Extraction as a Basis for High-Precision Text", } @Article{Anonymous:1994:IA, author = "Anonymous", title = "Information for Authors", journal = j-TOIS, volume = "12", number = "3", pages = "333--337", month = jul, year = "1994", bibdate = "Mon Jan 18 12:02:07 1999", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Merz:1994:DQF, author = "Ulla Merz and Roger King", title = "{DIRECT}: a Query Facility for Multiple Databases", journal = j-TOIS, volume = "12", number = "4", pages = "339--359", month = oct, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The subject of this research project is the architecture and design of a multidatabase query facility. These databases contain structured data, typical for business applications. Problems addressed are: presenting a uniform interface for retrieving data from multiple databases, providing autonomy for the component databases, and defining an architecture for semantic services. DIRECT is a query facility for heterogeneous databases. The databases and their definitions can differ in their data models, names, types, and encoded values. Instead of creating a global schema, descriptions of different databases are allowed to coexist. A multidatabase query language provides a uniform interface for retrieving data from different databases. DIRECT has been exercised with operational databases that are part of an automated business system.", acknowledgement = ack-nhfb, affiliation = "Univ of Colorado", affiliationaddress = "Boulder, CO, USA", classification = "721.1; 723.1; 723.2; 723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computational linguistics; Computer architecture; Data models; Data structures; direct query facility; Heterogeneous databases; Information retrieval; Interfaces (computer); Multiple databases; Query languages", } @Article{Chang:1994:SAB, author = "Man Kit Chang and Carson C. Woo", title = "A Speech Act Based Negotiation Protocol: Design, Implementation, and Test Use", journal = j-TOIS, volume = "12", number = "4", pages = "360--382", month = oct, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Existing negotiation protocols used in Distributed Artificial Intelligence (DAI) systems rarely take into account the results from negotiation research. We propose a negotiation protocol, SANP (Speech-Act-based Negotiation Protocol), which is based on Ballmer and Brennenstuhl's speech act classification and on negotiation analysis literature. The protocol is implemented as a domain-independent system using Strudel, which is an electronic mail toolkit. A small study tested the potential use of the protocol. Although a number of limitations were found in the study, the protocol appears to have potential in domains without these limitations, and it can serve as a building block to design more general negotiation protocols.", acknowledgement = ack-nhfb, affiliation = "Hong Kong Baptist Coll", affiliationaddress = "Hong Kong", classification = "722.3; 722.4; 723.1; 723.4; 723.5; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Data communication systems; Data structures; Distributed artificial intelligence; Distributed computer systems; Electronic mail; Expert systems; Information retrieval systems; Network protocols; Office automation; Organizational computing systems; Societies and institutions; Speech act based negotiation protocol", } @Article{Chimera:1994:EET, author = "Richard Chimera and Ben Shneiderman", title = "An Exploratory Evaluation of Three Interfaces for Browsing Large Hierarchical Tables of Contents", journal = j-TOIS, volume = "12", number = "4", pages = "383--406", month = oct, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Three different interfaces were used to browse a large (1296 items) table of contents. A fully expanded stable interface, expand\slash contract interface, and multipane interface were studied in a between-groups experiment with 41 novice participants. Nine timed fact retrieval tasks were performed; each task is analyzed and discussed separately. We found that both the expand\slash contract and multipane interfaces produced significantly faster times than the stable interface for many tasks using this large hierarchy; other advantages of the expand\slash contract and multipane interfaces over the stable interface are discussed. The animation characteristics of the expand\slash contract interface appear to play a major role. Refinements to the multipane and expand\slash contract interfaces are suggested. A predictive model for measuring navigation effort of each interface is presented.", acknowledgement = ack-nhfb, affiliation = "Univ of Maryland", affiliationaddress = "College Park, MD, USA", classification = "461.4; 722.2; 723.2; 903.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Expand/contract interfaces; Hierarchical systems; Hierarchical tables of contents; Human engineering; Man machine systems; Multipane interfaces; Online searching; User interfaces", wwwauthor = "B. Shneiderman and R. Chimera", wwwtitle = "Evaluation of Three Interfaces for Browsing Hierarchical Tables of Contents", } @Article{Wong:1994:PBD, author = "Stephen T. C. Wong", title = "Preference-Based Decision Making for Cooperative Knowledge-Based Systems", journal = j-TOIS, volume = "12", number = "4", pages = "407--435", month = oct, year = "1994", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Recent advances in cooperative knowledge-based systems (CKBS) offer significant promise for intelligent interaction between multiple AI systems for solving larger, more complex problems. In this paper, we propose a logical, qualitative problem-solving scheme for CKBS that uses social choice theory as a formal basis for making joint decisions and promoting conflict resolution. This scheme consists of three steps: (1) the selection of decision criteria and competing alternatives, (2) the formation of preference profiles and collective choices, and (3) the negotiation among agents as conflicts arise in group decision making. In this paper, we focus on the computational mechanisms developed to support steps (2) and (3) of the scheme. In addition, the practicality of the scheme is illustrated with examples taken from a working prototype dealing with collaborative structural design of buildings.", acknowledgement = ack-nhfb, affiliation = "Inst for New Generation Computer Technology", affiliationaddress = "Tokyo, Jpn", classification = "461.4; 723.2; 723.4; 723.4.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Cooperative knowledge based systems; Decision support systems; Distributed artificial intelligence; Heuristic methods; Human engineering; Information retrieval systems; Knowledge based systems; Preference based decision making; Social choice theory", wwwtitle = "Cooperative Decision Making Based on Preferences", } @Article{Isakowitz:1995:TLP, author = "Tom{\'a}s Isakowitz and Shimon Schocken and Henry C. {Lucas, Jr.}", title = "Toward a Logical\slash Physical Theory of Spreadsheet Modeling", journal = j-TOIS, volume = "13", number = "1", pages = "1--37", month = jan, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "In spite of the increasing sophistication and power of commercial spreadsheet packages, we still lack a formal theory or a methodology to support the construction and maintenance of spreadsheet models. Using a dual logical\slash physical perspective, we identify four principal components that characterize any spreadsheet model: schema, data, editorial, and binding. We present a factoring algorithm for identifying and extracting these components from conventional spreadsheets with minimal user intervention, and a synthesis algorithm that assists users in the construction of executable spreadsheets from reusable model components. This approach opens new possibilities for applying object-oriented and model management techniques to support the construction, sharing, and reuse of spreadsheet models in organizations. Importantly, our approach to model management and the Windows-based prototype that we have developed are designed to coexist with, rather than replace, traditional spreadsheet programs. In other words, the users are not required to learn a new modeling language; instead, their logical models and data sets are extracted from their spreadsheets transparently, as a side-effect of using standard spreadsheet programs.", acknowledgement = ack-nhfb, affiliation = "New York Univ", classification = "723.1; 723.1.1; 723.2; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Computer programming languages; Computer simulation; Computer software; Data reduction; Data structures; Factoring algorithm; Model management; Spreadsheet modeling theory; Spreadsheets", } @Article{Wong:1995:MIR, author = "S. K. M. Wong and Y. Y. Yao", title = "On Modeling Information Retrieval with Probabilistic Inference", journal = j-TOIS, volume = "13", number = "1", pages = "38--68", month = jan, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "This article examines and extends the logical models of information retrieval in the context of probability theory. The fundamental notions of term weights and relevance are given probabilistic interpretations. A unified framework is developed for modeling the retrieval process with probabilistic inference. This new approach provides a common conceptual and mathematical basis for many retrieval models, such as the Boolean, fuzzy set, vector space, and conventional probabilistic models. Within this framework, the underlying assumptions employed by each model are identified, and the inherent relationships between these models are analyzed. Although this article is mainly a theoretical analysis of probabilistic inference for information retrieval, practical methods for estimating the required probabilities are provided by simple examples.", acknowledgement = ack-nhfb, affiliation = "Univ of Regina", affiliationaddress = "Regina, Sask, Can", classification = "721.1; 723.2; 903.1; 903.3; 921.1; 921.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Boolean algebra; Data structures; Document representation; Fuzzy sets; Indexing (of information); Information retrieval; Information theory; Mathematical models; Maximum entropy principle; Minimum entropy principle; Probabilistic logics; Probability; Similarity measures; Theorem proving; Vector space model", } @Article{Salminen:1995:THI, author = "Airi Salminen and Jean Tague-Sutcliffe and Charles McClellan", title = "From Text to Hypertext by Indexing", journal = j-TOIS, volume = "13", number = "1", pages = "69--99", month = jan, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "A model is presented for converting a collection of documents to hypertext by means of indexing. The documents are assumed to be semistructured, i.e., their text is a hierarchy of parts, and some of the parts consist of natural language. The model is intended as a framework for specifying hypertextual reading capabilities for specific application areas and for developing new automated tools for the conversion of semistructured text to hypertext. In the model, two well-known paradigms --- formal grammars and document indexing --- are combined. The structure of the source text is defined by a schema that is a constrained context-free grammar. The hierarchic structure of the source may thus be modeled by a parse tree for the grammar. The effect of indexing is described by grammar transformations. The new grammar, called an indexing schema, is associated with a new parse tree where some text parts are index elements. The indexing schema may hide some parts of the original documents or the structure of some parts. For information retrieval, parts of the indexed text are considered to be nodes of a hypergraph. In the hypergraph-based information access, the navigation capabilities of hypertext systems are combined with the querying capabilities of information retrieval systems.", acknowledgement = ack-nhfb, affiliation = "Univ of Jyvaskyla", affiliationaddress = "Jyvaskyla, Finl", classification = "721.1; 723.2; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Automata theory; Constraint theory; Content analysis; Context free grammars; Data structures; Formal logic; Hypertext; Indexing (of information); Information retrieval systems; Structured text; Text entities; Transient hypergraphs", wwwpages = "69--111", } @Article{Cooper:1995:SIM, author = "William S. Cooper", title = "Some Inconsistencies and Misidentified Modeling Assumptions in Probabilistic Information Retrieval", journal = j-TOIS, volume = "13", number = "1", pages = "100--111", month = jan, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Research in the probabilistic theory of information retrieval involves the construction of mathematical models based on statistical assumptions. One of the hazards inherent in this kind of theory construction is that the assumptions laid down may be inconsistent in unanticipated ways with the data to which they are applied. Another hazard is that the stated assumptions may not be those on which the derived modeling equations or resulting experiments are actually based. Both kinds of mistakes have been made in past research on probabilistic information retrieval. One consequence of these errors is that the statistical character of certain probabilistic IR models, including the so-called Binary Independence model, has been seriously misapprehended.", acknowledgement = ack-nhfb, affiliation = "Univ of California", affiliationaddress = "Berkeley, CA, USA", classification = "721.1; 722.4; 723.2; 903.3; 922.1; 922.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Bibliographic retrieval systems; Bibliographic searching; Binary independence model; Data structures; Document retrieval; Hazards and race conditions; Information retrieval; Online searching; Probabilistic logics; Probability; Statistical methods", wwwtitle = "Some Inconsistencies and Misidentified Modelling Assumptions in Probabilistic Information Retrieval", } @Article{Anonymous:1995:AR, author = "Anonymous", title = "Acknowledgment to Referees", journal = j-TOIS, volume = "13", number = "1", pages = "112--113", month = jan, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gudivada:1995:DEA, author = "Venkat N. Gudivada and Vijay V. Raghavan", title = "Design and Evaluation of Algorithms for Image Retrieval by Spatial Similarity", journal = j-TOIS, volume = "13", number = "2", pages = "115--144", month = apr, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "An algorithm for computing the spatial similarity between two symbolic images is proposed. This algorithms is simple in the sense that it can deal with translation, scale and rotational variances in images. The idea of quantifying a system's retrieval quality by having an expert specify the expected rank ordering with respect to each query for a set of test queries is also introduced. Finally, a comparison of the characteristics of the proposed algorithm with those of the previously available algorithms revealed that the proposed algorithm is more efficient and it provides a rank ordering of images that consistently matches with the expert's expected rank ordering.", acknowledgement = ack-nhfb, affiliation = "Ohio Univ", affiliationaddress = "Athens, OH, USA", classification = "721.1; 722.2; 723.1; 723.3; 903.3; 921.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Computational complexity; Database systems; Expert systems; Graph theory; Image databases; Image retrieval; Image retrieval systems; Information retrieval; Information retrieval systems; Query languages; Rotational invariance; Spatial similarity; User interfaces", wwwtitle = "An Experimental Evaluation of Algorithms for Retrieval by Spatial Similarity", } @Article{Rangan:1995:FTC, author = "P. Venkat Rangan and Srinivas Ramanathan and Srihari Sampathkumar", title = "Feedback Techniques for Continuity and Synchronization in Multimedia Information Retrieval", journal = j-TOIS, volume = "13", number = "2", pages = "145--176", month = apr, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "The development of techniques for supporting continuous and synchronous retrieval from multimedia servers is discussed. Several feedback techniques that remain robust even in the presence of playback rate mismatches and network delay jitter are presented. In general, the constant rate feedback techniques developed in this study form the basis of a prototype on-demand information server developed at the UCSD Multimedia Laboratory.", acknowledgement = ack-nhfb, affiliation = "Univ of California at San Diego", affiliationaddress = "La Jolla, CA, USA", classification = "722.3; 723.3; 723.5; 903.3; 903.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer networks; Computer simulation; Feedback; Information retrieval; Information retrieval systems; Information services; Intermedia synchronization; Intramedia continuity; Multimedia; Multimedia information retrieval; Synchronization", wwwauthor = "P. V. Rangan and S. Ramanathan", } @Article{Malone:1995:EOR, author = "Thomas W. Malone and Kum-Yew Lai and Christopher Fry", title = "Experiments with Oval: a Radically Tailorable Tool for Cooperative Work", journal = j-TOIS, volume = "13", number = "2", pages = "177--205", month = apr, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "This article describes a series of tests of the generality of a `radically tailorable' tool for cooperative work. Users of this system can create applications by combining and modifying four kinds of building blocks: objects, views, agents, and links. We found that user-level tailoring of these primitives can provide most of the functionality found in well-known cooperative work systems such as gIBIS, Coordinator, Lotus Notes, and Information Lens. These primitives, therefore, appear to provide an elementary `tailoring language' out of which a wide variety of integrated information management and collaboration applications can be constructed by end users.", acknowledgement = ack-nhfb, affiliation = "MIT Cent for Coordination Science", affiliationaddress = "Cambridge, MA, USA", classification = "722.2; 723.1; 723.1.1; 723.3; 723.5; 903", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer aided software engineering; Computer programming; Computer simulation; Computer supported cooperative work; End user programming; High level languages; Human engineering; Information management; Information retrieval systems; Radical tailorability; User interfaces", } @Article{Strong:1995:EEH, author = "Diane M. Strong and Steven M. Miller", title = "Exceptions and Exception Handling in Computerized Information Processes", journal = j-TOIS, volume = "13", number = "2", pages = "206--233", month = apr, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Exceptions, situations that cannot be correctly processed by computer systems, occur frequently in computer-based information processes. Five perspectives on exceptions provide insights into why exceptions occur and how they might be eliminated or more efficiently handled. We investigate these perspectives using an in-depth study of an operating information process that has frequent exceptions. Our results support the use of a total quality management (TQM) approach of eliminating exceptions for some exceptions, in particular, those caused by computer systems that are poor matches to organizational processes. However, some exceptions are explained better by a political system perspective of conflicting goals between subunits. For these exceptions and several other types, designing an integrated human-computer process will provide better performance than will eliminating exceptions and moving toward an entirely automated process.", acknowledgement = ack-nhfb, affiliation = "Boston Univ", affiliationaddress = "Boston, MA, USA", classification = "722.2; 722.4; 723.2; 723.5; 912.2; 913.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Administrative data processing; Computer applications; Computer systems; Computerized information processes; Data handling; Data processing; Exception handling; Exceptions; Human computer interaction; Office automation; Performance; Process design; Quality assurance; Total quality management", } @Article{Celentano:1995:KBD, author = "Augusto Celentano and Maria Grazia Fugini and Silvano Pozzi", title = "Knowledge-Based Document Retrieval in Office Environments: The {Kabiria} System", journal = j-TOIS, volume = "13", number = "3", pages = "237--268", month = jul, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "In the office environment, the retrieval of documents is performed using the concepts contained in the documents, information about the procedural context where the documents are used, and information about the regulations and laws that discipline the life of documents within a given application domain. To fulfill the requirements of such a sophisticated retrieval, we propose a document retrieval model and system based on the representation of knowledge describing the semantic contents of documents, the way in which the documents are managed by procedures and by people in the office, and the application domain where the office operates. The article describes the knowledge representation issues needed for the document retrieval system and presents a document retrieval model that captures these issues. The effectiveness of the approach is illustrated by describing a system, named Kabiria, built on top of such model. The article describes the querying and browsing environments, and the architecture of the system.", acknowledgement = ack-nhfb, affiliation = "Politecnico di Milano", affiliationaddress = "Milano, Italy", classification = "722.1; 722.4; 723.1.1; 723.2; 723.4.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Administrative data processing; Browser; Computational linguistics; Computer programming languages; Data reduction; Data structures; Expert systems; Hypertext; Information retrieval systems; Kabiria system; Knowledge based document retrieval; Knowledge based systems; Object orientation; Office automation; Systems analysis; User interfaces", } @Article{Tuzhilin:1995:TKB, author = "Alexander Tuzhilin", title = "{Templar}: a Knowledge-Based Language for Software Specifications Using Temporal Logic", journal = j-TOIS, volume = "13", number = "3", pages = "269--304", month = jul, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "A software specification language Templar is defined in this article. The development of the language was guided by the following objectives: requirements specifications written in Templar should have a clear syntax and formal semantics, should be easy for a systems analyst to develop and for an end-user to understand, and it should be easy to map them into a broad range of design specifications. Templar is based on temporal logic and on the Activity-Event-Condition-Activity model of a rule which is an extension of the Event-Condition-Activity model in active databases. The language supports a rich set of modeling primitives, including rules, procedures, temporal logic operators, events, activities, hierarchical decomposition of activities, parallelism, and decisions combined together into a cohesive system.", acknowledgement = ack-nhfb, affiliation = "New York Univ", affiliationaddress = "New York, NY, USA", classification = "721.1; 723.1.1; 723.4.1; 921.6; 922.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computational linguistics; Computer hardware description languages; Computer programming languages; Database systems; Decision making; Formal logic; Hierarchical systems; Knowledge based language Templar; Knowledge based systems; Mathematical operators; Natural languages; Software engineering; Temporal logic", } @Article{Koike:1995:FVF, author = "Hideki Koike", title = "Fractal Views: a Fractal-Based Method for Controlling Information Display", journal = j-TOIS, volume = "13", number = "3", pages = "305--323", month = jul, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "Computer users often must view large amounts of information through video displays which are physically limited in size. Although some methods, which automatically display\slash erase information units based on their degrees of importance, have been proposed, they lack an ability to keep the total amount of displayed information nearly constant. We propose a new method for information display based on fractal theory. By regarding the information structures used in computers as complex objects, we can abstract these objects as well as control their amount. Using our method, (1) the total amount of information is kept nearly constant even when users change their focuses of attention and (2) this amount can be set flexibly. Through mathematical analysis, we show our method's ability to control the amount. An application to program display is also shown. When this method is applied to the display of structured programs, it provides fisheye-like views which integrate local details around the focal point and major landmarks further away.", acknowledgement = ack-nhfb, affiliation = "Univ of Electro-Communications", affiliationaddress = "Tokyo, Jpn", classification = "722.2; 723.1; 723.2; 723.5; 903.1; 921.6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer systems programming; Data structures; Fractals; Information analysis; Information visualization; Program display; Software engineering; Systems analysis; UI theory; User interfaces", wwwpages = "305--324", } @Article{Kwok:1995:NAP, author = "K. L. Kwok", title = "A Network Approach to Probabilistic Information Retrieval", journal = j-TOIS, volume = "13", number = "3", pages = "324--353", month = jul, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "In this article we show how probabilistic information retrieval based on document components may be implemented as a feedforward (feedbackward) artificial neural network. The network supports adaptation of connection weights as well as the growing of new edges between queries and terms based on user relevance feedback data for training, and it reflects query modification and expansion in information retrieval. A learning rule is applied that can also be viewed as supporting sequential learning using a harmonic sequence learning rate. Experimental results with four standard small collections and a large Wall Street Journal collection (173,219 documents) show that performance of feedback improves substantially over no feedback, and further gains are obtained when queries are expanded with terms from the feedback documents. The effect is much more pronounced in small collections than in the large collection. Query expansion may be considered as a tool for both precision and recall enhancement. In particular, small query expansion levels of about 30 terms can achieve most of the gains at the low-recall high-precision region, while larger expansion levels continue to provide gains at the high-recall low-precision region of a precision recall curve.", acknowledgement = ack-nhfb, affiliation = "City Univ of New York", affiliationaddress = "Flushing, NY, USA", classification = "721.1; 723.2; 723.4; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data reduction; Data structures; Document focused relevance feedback; Feedback; Feedforward neural networks; Indexing (of information); Information retrieval; Learning systems; Probabilistic information retrieval; Probabilistic logics; Query expansion; Query focused relevance feedback", wwwpages = "325-354", } @Article{Kong:1995:DDI, author = "Q. Kong and G. Chen", title = "On Deductive Databases with Incomplete Information", journal = j-TOIS, volume = "13", number = "3", pages = "354--369", month = jul, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", abstract = "In order to extend the ability to handle incomplete information in a definite deductive database, a Horn clause-based system representing incomplete information as incomplete constants is proposed. By using the notion of incomplete constants the deductive database system handles incomplete information in the form of sets of possible values, thereby giving more information than null values. The resulting system extends Horn logic to express a restricted form of indefiniteness. Although a deductive database with this kind of incomplete information is, in fact, a subset of an indefinite deductive database system, it represents indefiniteness in terms of value incompleteness, and therefore it can make use of the existing Horn logic computation rules. The inference rules for such a system are presented, its model theory discussed, and a model theory of indefiniteness proposed. The theory is consistent with minimal model theory and extends its expressive power.", acknowledgement = ack-nhfb, affiliation = "Univ of Queensland", affiliationaddress = "Queensland, Aust", classification = "721.1; 723.1.1; 723.2; 723.3; 723.4.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data structures; Database systems; Formal logic; Horn clause; Incomplete information; Inference engines; Prolog (programming language); Query evaluation; Query languages; Systems analysis", wwwpages = "355--369", wwwtitle = "On Deductive Database with Incomplete Information", } @Article{Stevens:1995:ISI, author = "Scott Stevens and Thomas Little", title = "Introduction to the Special Issue on Video Information Retrieval", journal = j-TOIS, volume = "13", number = "4", pages = "371--372", month = oct, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", wwwauthor = "Tom Little and Scott Stevens", wwwtitle = "Guest Editors' Introduction", } @Article{Chua:1995:VRS, author = "Tat-Seng Chua and Li-Qun Ruan", title = "A Video Retrieval and Sequencing System", journal = j-TOIS, volume = "13", number = "4", pages = "373--407", month = oct, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Video Information Retrieval.", URL = "http://www.acm.org:80", abstract = "Video is an effective medium for capturing the events in the real world around us, and a vast amount of video materials exists, covering a wide range of applications. However, widespread use of video in computer applications is often impeded by the lack of effective tools to manage video information systematically. This article discusses the design and implementation of a frame-based video retrieval and sequencing system (VRSS). The system is designed to support the entire process of video information management: segmenting, indexing, retrieving, and sequencing of video data. A semiautomatic tool is developed to divide video sequences into meaningful shots. Each video shot is logged using text descriptions, audio dialogue, and cinematic attributes. A two-layered, concept-based model is used as the basis for accurately retrieving relevant video shots based on users' free-text queries. A cinematic, rule-based, virtual editing tool is also developed to sequence the video shots retrieved for presentation within a specified time constraint. The system has been tested on a video documentary on the NUS (National University of Singapore) engineering faculty. The results of video retrieval experiments are encouraging.", acknowledgement = ack-nhfb, affiliation = "Natl Univ of Singapore", affiliationaddress = "Singapore, Singapore", classification = "722.2; 723.2; 723.3; 723.4.1; 723.5; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Cinematic rules; Computer simulation; Data structures; Frame based modeling; Image segmentation; Indexing (of information); Information management; Information retrieval; Information retrieval systems; Knowledge based systems; Knowledge representation; Multimedia; Query languages; Systems analysis; User interfaces; Video; Video retrieval; Video retrieval and sequencing system; Video signal processing; Virtual editing", } @Article{Dimitrova:1995:MRV, author = "Nevenka Dimitrova and Forouzan Golshani", title = "Motion Recovery for Video Content Classification", journal = j-TOIS, volume = "13", number = "4", pages = "408--439", month = oct, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Video Information Retrieval.", URL = "http://www.acm.org:80", abstract = "Like other types of digital information, video sequences must be classified based on the semantics of their contents. A more-precise and completer extraction of semantic information will result in a more-effective classification. The most-discernible difference between still images and moving pictures stems from movements and variations. Thus, to go from the realm of still-image repositories to video databases, we must be able to deal with motion. Particularly, we need the ability to classify objects appearing in a video sequence based on their characteristics and features such as shape or color, as well as their movements. By describing the movements that we derive from the process of motion analysis, we introduce a dual hierarchy consisting of spatial and temporal parts for video sequence representation. This gives us the flexibility to examine arbitrary sequences of frames at various levels of abstraction and to retrieve the associated temporal information (say, object trajectories) in addition to the spatial representation. Our algorithm for motion detection uses the motion compensation component of the MPEG video-encoding scheme and then computes trajectories for objects of interest. The specification of a language for retrieval of video based on the spatial as well as motion characteristics is presented.", acknowledgement = ack-nhfb, affiliation = "Arizona State Univ", affiliationaddress = "Tempe, AZ, USA", classification = "723.1; 723.1.1; 723.2; 723.3; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Classification (of information); Computer hardware description languages; Database systems; Feature extraction; Image analysis; Image coding; Information retrieval; Motion pictures; Motion recovery; mpeg; Object recognition; Video analysis; Video content classification; Video databases; Video retrieval; Video sequence; Video signal processing", } @Article{Bulterman:1995:EVH, author = "Dick C. A. Bulterman", title = "Embedded Video in Hypermedia Documents: Supporting Integration and Adaptive Control", journal = j-TOIS, volume = "13", number = "4", pages = "440--470", month = oct, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Video Information Retrieval.", URL = "http://www.acm.org:80", abstract = "As the availability of digital video becomes commonplace, a shift in application focus will occur from merely accessing video as an independent data stream to embedding video with other multimedia data types into coordinated hypermedia presentations. The migration to embedded video will present new demands on application and support environments: processing of any one piece of video data will depend on how that data relates to other data streams active within the same presentation. This article describes presentation, synchronization, and interaction control issues for manipulating embedded video. First we describe the requirements for embedded video, contrasted against other forms of video use. Next we consider mechanisms for describing and implementing the behavior of embedded-video segments relative to other data items in a document; these relationships form the basis of implementing cooperative control among the events in a presentation. Finally we consider extending the possibilities for tailoring embedded video to the characteristics of the local runtime environment; this forms the basis for adaptive, application-level quality-of-service control of a presentation. In all cases, we describe a mechanism to externalize the behavior of hypermedia presentations containing resource-intensive data requirements so that effective control can be implemented by low-level system facilities based on application-specific requirements. We present our results in terms of the CMIFed authoring\slash presentation system.", acknowledgement = ack-nhfb, affiliation = "Centrum voor Wiskunde en Informatica", affiliationaddress = "Amsterdam, Neth", classification = "723.1; 723.2; 731.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Adaptive control systems; Algorithms; Data processing; Embedded video; Hypermedia documents; Information retrieval systems; Multimedia; Synchronization; Systems analysis; Video presentation; Video signal processing", } @Article{Keller:1995:XAI, author = "Ralf Keller and Wolfgang Effelsberg and Bernd Lamparter", title = "{XMovie}: Architecture and Implementation of a Distributed Movie System", journal = j-TOIS, volume = "13", number = "4", pages = "471--499", month = oct, year = "1995", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "Special Issue on Video Information Retrieval.", URL = "http://www.acm.org:80", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", } @Article{Anonymous:1996:MGS, author = "Anonymous", title = "In Memoriam: {Gerard Salton}", journal = j-TOIS, volume = "14", number = "1", pages = "1--1", month = jan, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 17:28:08 1999", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lucarella:1996:VRE, author = "Dario Lucarella and Antonella Zanzi", title = "A Visual Retrieval Environment for Hypermedia Information Systems", journal = j-TOIS, volume = "14", number = "1", pages = "3--29", month = jan, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/lucarella.html", abstract = "A graph-based object model that may be used as a uniform framework for direct manipulation of multimedia information is presented. After motivating the need for abstraction and structuring mechanisms in hypermedia systems, the notion of perspective is introduced, which is a form of data abstraction that acts as a user interface to the system, providing control over the visibility of the objects and their properties. Presented is a visual retrieval environment that effectively combines filtering, browsing, and navigation to provide an integrated view of the retrieval problem. Design and implementation issues are outlined for MORF (Multimedia Object Retrieval Environment), a prototype system relying on the proposed model. The focus is on the main user interface functionalities. Actual interaction sessions are presented including schema creation, information loading, and information retrieval.", acknowledgement = ack-nhfb, affiliation = "Centro Ricerca di Automatica", affiliationaddress = "Milano, Italy", classification = "722.2; 723.2; 723.3; 723.5; 903.3; 903.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Abstracting; Browsing; Computer simulation; Data structures; Database systems; Graphical user interfaces; Hypermedia information systems; Hypertext; Information filtering; Information retrieval systems; Information services; Information technology; Interactive computer graphics; Multimedia; Multimedia object retrieval environment; Pattern matching; Schema graph; Subgraph; Systems analysis; Visual retrieval environment; Visualization", } @Article{Robey:1996:SPI, author = "Daniel Robey and Michael Newman", title = "Sequential Patterns in Information Systems Development: An Application of a Social Process Model", journal = j-TOIS, volume = "14", number = "1", pages = "30--63", month = jan, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/robey.html", abstract = "We trace the process of developing and implementing a materials management system in one company over a 15-year period. Using a process research model developed by Newman and Robey, we identify 44 events in the process and define them as either encounters or episodes. Encounters are concentrated events, such as meetings and announcements, that separate episodes, which are events of longer duration. By examining the sequence of events over the 15 years of the case, we identify a pattern of repeated failure, followed by success. Our discussion centers on the value of detecting and displaying such patterns and the need for theoretical interpretation of recurring sequences of events. Five alternative theoretical perspectives, originally proposed by Kling, are used to interpret the sequential patterns identified by the model. We conclude that the form of the process model allows researchers who operate from different perspectives to enrich their understanding of the process of system development.", acknowledgement = ack-nhfb, affiliation = "Georgia State Univ", affiliationaddress = "Atlanta, GA, USA", classification = "722.4; 723.2; 723.3; 723.5; 903.3; 912.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Administrative data processing; Computer systems; Data structures; Database systems; Information retrieval systems; Management information systems; Materials management system; Process research model; Sequential patterns; Social process model; System implementation; Systems analysis", wwwtitle = "Sequential Patterns in Information Systems Development: An Application of a Process Model", } @Article{Taghva:1996:EMB, author = "Kazem Taghva and Julie Borsack and Allen Condit", title = "Evaluation of Model-Based Retrieval Effectiveness with {OCR} Text", journal = j-TOIS, volume = "14", number = "1", pages = "64--93", month = jan, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/taghva.html", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", } @Article{Berghel:1996:EUE, author = "Hal Berghel and David Roach", title = "An Extension of {Ukkonen}'s Enhanced Dynamic Programming {ASM} Algorithm", journal = j-TOIS, volume = "14", number = "1", pages = "94--106", month = jan, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/berghel.html", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", } @Article{Lee:1996:DRW, author = "Dik Lun Lee and Liming Ren", title = "Document Ranking on Weight-Partitioned Signature Files", journal = j-TOIS, volume = "14", number = "2", pages = "109--137", month = apr, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/lee.html", abstract = "A signature file organization, called the weight-partitioned signature file, for supporting document ranking is proposed. It employs multiple signature files, each of which corresponds to one term frequency, to represent terms with different term frequencies. Words with the same term frequency in a document are grouped together and hashed into the signature file corresponding to that term frequency. This eliminates the need to record the term frequency explicitly for each word. We investigate the effect of false drops on retrieval effectiveness if they are not eliminated in the search process. We have shown that false drops introduce insignificant degradation on precision and recall when the false-drop probability is below a certain threshold. This is an important result since false-drop elimination could become the bottleneck in systems using fast signature file search techniques. We perform an analytical study on the performance of the weight-partitioned signature file under different search strategies and configurations. An optimal formula is obtained to determine for a fixed total storage overhead the storage to be allocated to each partition in order to minimize the effect of false drops on document ranks. Experiments were performed using a document collection to support the analytical results.", acknowledgement = ack-nhfb, affiliation = "Ohio State Univ", affiliationaddress = "Columbus, OH, USA", classification = "722.1; 723.2; 723.5; 903.3; 922.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Access method; Computer simulation; Document ranking; Document retrieval; Encoding (symbols); File organization; Information retrieval; Information retrieval systems; Performance; Probability; Storage allocation (computer); Superimposed coding; Text retrieval; Weight partitioned signature files", } @Article{Rowe:1996:ULO, author = "Neil C. Rowe", title = "Using Local Optimality Criteria for Efficient Information Retrieval with Redundant Information Filters", journal = j-TOIS, volume = "14", number = "2", pages = "138--174", month = apr, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/rowe.html", abstract = "We consider information retrieval when the data --- for instance, multimedia --- is computationally expensive to fetch. Our approach uses `information filters' to considerably narrow the universe of possibilities before retrieval. We are especially interested in redundant information filters that save time over more general but more costly filters. Efficient retrieval requires that decisions must be made about the necessity, order, and concurrent processing of proposed filters (an `execution plan'). We develop simple polynomial-time local criteria for optimal execution plans and show that most forms of concurrency are suboptimal with information filters. Although the general problem of finding an optimal execution plan is likely to be exponential in the number of filters, we show experimentally that our local optimality criteria, used in a polynomial-time algorithm, nearly always find the global optimum with 15 filters or less, a sufficient number of filters for most applications. Our methods require no special hardware and avoid the high processor idleness that is characteristic of massive-parallelism solutions to this problem. We apply our ideas to an important application, information retrieval of captioned data using natural-language understanding, a problem for which the natural-language processing can be the bottleneck if not implemented well.", acknowledgement = ack-nhfb, affiliation = "Naval Postgraduate Sch", affiliationaddress = "Monterey, CA, USA", classification = "721.1; 723.1; 723.2; 723.3; 903.3; 921.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Boolean algebra; Concurrency control; Conjunction; Information retrieval; Information retrieval systems; Natural language processing systems; Optimization; Performance; Query languages; Redundant information filters", } @Article{Jungclaus:1996:TLO, author = "Ralf Jungclaus and Gunter Saake and Thorsten Hartmann and Cristina Sernadas", title = "{TROLL} --- {A} Language for Object-Oriented Specification of Information Systems", journal = j-TOIS, volume = "14", number = "2", pages = "175--211", month = apr, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/hartmann.html", abstract = "TROLL is a language particularly suited for the early stages of information system development, when the universe of discourse must be described. In TROLL the descriptions of the static and dynamic aspects of entities are integrated into object descriptions. Sublanguages for data terms, for first-order and temporal assertions, and for processes, are used to describe respectively the static properties, the behavior, and the evolution over time of objects. TROLL organizes system design through object-orientation and the support of abstractions such as classification, specialization, roles, and aggregation. Language features for state interactions and dependencies among components support the composition of the system from smaller modules, as does the facility of defining interfaces on top of object descriptions.", acknowledgement = ack-nhfb, affiliation = "Deutsche Telekom", affiliationaddress = "Bonn, Ger", classification = "723.1; 723.1.1; 723.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer hardware description languages; Computer programming languages; Data processing; Language classifications; Language constructs and features; Management information systems; Object oriented specification; Software engineering; Systems analysis", } @Article{Grant:1996:CPM, author = "Rebecca A. Grant and Chris A. Higgins", title = "Computerized Performance Monitors as Multidimensional Systems: Derivation and Application", journal = j-TOIS, volume = "14", number = "2", pages = "212--235", month = apr, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/grant.html", abstract = "An increasing number of companies are introducing computer technology into more aspects of work. Effective use of information systems to support office and service work can improve staff productivity, broaden a company's market, or dramatically change its business. It can also increase the extent to which work is computer mediated and thus within the reach of software known as Computerized Performance Monitoring and Control Systems (CPMCSs). Virtually all research has studied CPMCSs as unidimensional systems. Employees are described as `monitored' or `unmonitored' or as subject to `high,' `moderate,' or `low' levels of monitoring. Research that does not clearly distinguish among possible monitor design cannot explain how designs may differ in effect. Nor can it suggest how to design better monitors. A multidimensional view of CPMCSs describes monitor designs in terms of object of measurements, tasks measured, recipient of data, reporting period, and message content. This view is derived from literature in control systems, organizational behavior, and management information systems. The multidimensional view can then be incorporated into causal models to explain contradictory results of earlier CPMCS research.", acknowledgement = ack-nhfb, affiliation = "Univ of Victoria", affiliationaddress = "Victoria, BC, Can", classification = "723.1; 723.2; 723.5; 731.1; 912.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer applications; Computer software; Computerized performance evaluation; Computerized performance monitoring and control systems; Computerized work monitoring; Control systems; Management information systems; Monitoring; Personnel rating; Productivity; Systems analysis; Work monitoring system design", } @Article{Guglielmo:1996:NLR, author = "Eugene J. Guglielmo and Neil C. Rowe", title = "Natural-Language Retrieval of Images Based on Descriptive Captions", journal = j-TOIS, volume = "14", number = "3", pages = "237--267", month = jul, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/guglielmo.html", abstract = "We describe a prototype intelligent information retrieval system that uses natural-language understanding to efficiently locate captioned data. Multimedia data generally require captions to explain their features and significance. Such descriptive captions often rely on long nominal compounds (strings of consecutive nouns) which create problems of disambiguating word sense. In our system, captions and user queries are parsed and interpreted to produce a logical form, using a detailed theory of the meaning of nominal compounds. A fine-grain match can then compare the logical form of the query to the logical forms for each caption. To improve system efficiency, we first perform a coarse-grain match with index files, using nouns and verbs extracted from the query. Our experiments with randomly selected queries and captions from an existing image library show an increase of 30\% in precision and 50\% in recall over the keyphrase approach currently used. Our processing times have a media of seven seconds as compared to eight minutes for the existing system, and our system is much easier to use.", acknowledgement = ack-nhfb, affiliation = "Monterey Bay Aquarium Research Inst (MBARI)", affiliationaddress = "Moss Landing, CA, USA", classification = "723.1.1; 723.2; 723.3; 723.4.1; 741; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Coarse grain match; Computational linguistics; Database systems; Descriptive captions; Fine grain match; Formal logic; Image processing; Information retrieval systems; Intelligent information retrieval system; Knowledge based systems; Knowledge representation; Multimedia; Natural language processing systems; Query languages", } @Article{Gottlob:1996:EOO, author = "Georg Gottlob and Michael Schrefl and Brigitte Rock", title = "Extending Object-Oriented Systems with Roles", journal = j-TOIS, volume = "14", number = "3", pages = "268--296", month = jul, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/gottlob.html", abstract = "This article shows how class-based object-oriented systems can be extended to handle evolving objects well. Class hierarchies are complemented by role hierarchies, whose nodes represent role types an object classified in the root may take on. At any point in time, an entity is represented by an instance of the root and an instance of every role type whose role it currently plays. In a natural way, the approach extends traditional object-oriented concepts, such as classification, object identity, specialization, inheritance, and polymorphism in a natural way. The practicability of the approach is demonstrated by an implementation in Smalltalk. Smalltalk was chosen because it is widely known, which is not true for any particular class-based object-oriented database programming language. Roles can be provided in Smalltalk by adding a few classes. There is no need to modify the semantics of Smalltalk itself. Role hierarchies are mapped transparently onto ordinary classes. The presented implementation can easily be ported to object-oriented database programming languages based on Smalltalk, such as Gemstone's OPAL.", acknowledgement = ack-nhfb, affiliation = "Vienna Univ of Technology", affiliationaddress = "Wien, Austria", classification = "721.1; 723.1; 723.1.1; 723.2; 723.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Class hierarchies; Computational linguistics; Computer programming languages; Data structures; Database systems; Object oriented databases; Object oriented programming; Role hierarchies; Semantics; Smalltalk programming language; Software engineering", } @Article{Gulla:1996:GEC, author = "Jon Atle Gulla", title = "A General Explanation Component for Conceptual Modeling in {CASE} Environments", journal = j-TOIS, volume = "14", number = "3", pages = "297--329", month = jul, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/gulla.html", abstract = "In information systems engineering, conceptual models are constructed to assess existing information systems and work out requirements for new ones. As these models serve as a means for communication between customers and developers, it is paramount that both parties understand the models, as well as that the models form a proper basis for the subsequent design and implementation of the systems. New CASE environments are now experimenting with formal modeling languages and various techniques for validating conceptual models, though it seems difficult to come up with a technique that handles the linguistic barriers between the parties involved in a satisfactory manner. In this article, we discuss the theoretical basis of an explanation component implemented for the PPP CASE environment. This component integrates other validation techniques and provides a very flexible natural-language interface to complex model information. It describes properties of the modeling language and the conceptual models in terms familiar to users, and the explanations can be combined with graphical model views. When models are executed, it can justify requested inputs and explain computed outputs by relating trace information to properties of the models.", acknowledgement = ack-nhfb, classification = "721.1; 723.1; 723.1.1; 723.2; 723.3; 723.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Computational linguistics; Computer aided software engineering; Computer graphics; Computer simulation; Computer simulation languages; Conceptual modeling; Database systems; Formal languages; Information systems engineering; Natural language processing systems; Program documentation; Validation techniques", wwwtitle = "A General Explanation Component for Conceptual Modeling in {CASE} Environment", } @Article{Friedman:1996:BCS, author = "Batya Friedman and Helen Nissenbaum", title = "Bias in Computer Systems", journal = j-TOIS, volume = "14", number = "3", pages = "330--347", month = jul, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/friedman.html", abstract = "From an analysis of actual cases, three categories of bias in computer systems have been developed: preexisting, technical, and emergent. Preexisting bias has its roots in social institutions, practices, and attitudes. Technical bias arises from technical constraints or considerations. Emergent bias arises in a context of use. Although others have pointed to bias in particular computer systems and have noted the general problem, we know of no comparable work that examines this phenomenon comprehensively and which offers a framework for understanding and remedying it. We conclude by suggesting that freedom from bias should be counted among the select set of criteria --- including reliability, accuracy, and efficiency --- according to which the quality of systems in use in society should be judged.", acknowledgement = ack-nhfb, affiliation = "Colby Coll", affiliationaddress = "Waterville, ME, USA", classification = "461.4; 722.4; 723.2; 901.1; 901.1.1; 901.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer ethics; Computer systems; Human values; Man machine systems; Philosophical aspects; Reliability; Social aspects; Social computing; Social impact; Social sciences computing; Societies and institutions; Software engineering; Standards; Systems analysis", wwwpages = "330--346", wwwtitle = "Bias in Computer Science", } @Article{Moffat:1996:SII, author = "Alistair Moffat and Justin Zobel", title = "Self-Indexing Inverted Files for Fast Text Retrieval", journal = j-TOIS, volume = "14", number = "4", pages = "349--379", month = oct, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/moffat.html", abstract = "Query-processing costs on large text databases are dominated by the need to retrieve and scan the inverted list of each query term. Retrieval time for inverted lists can be greatly reduced by the use of compression, but this adds to the CPU time required. Here we show that the CPU component of query response time for conjunctive Boolean queries and for informal ranked queries can be similarly reduced, at little cost in terms of storage, by the inclusion of an internal index in each compressed inverted list. This method has been applied in a retrieval system for a collection of nearly two million short documents. Our experimental results show that the self-indexing strategy adds less than 20\% to the size of the compressed inverted file, which itself occupies less than 10\% of the indexed text, yet can reduce processing time for Boolean queries of 5-10 terms to under one fifth of the previous cost. Similarly, ranked queries of 40-50 terms can be evaluated in as little as 25\% of the previous time, with little or no loss of retrieval effectiveness.", acknowledgement = ack-nhfb, affiliation = "Univ of Melbourne", affiliationaddress = "Parkville, Aust", classification = "716.1; 722.1; 723.2; 723.3; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Boolean queries; Data compression; Data storage equipment; File organization; Full text retrieval; Index compression; Indexing (of information); Information retrieval; Information retrieval systems; Inverted file; Query languages; Query processing; Self indexing", } @Article{Oberweis:1996:ISB, author = "Andreas Oberweis and Peter Sander", title = "Information System Behavior Specification by High-Level {Petri} Nets", journal = j-TOIS, volume = "14", number = "4", pages = "380--420", month = oct, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/oberweis.html", abstract = "The specification of an information system should include a description of structural system aspects as well as a description of the system behavior. In this article, we show how this can be achieved by high-level Petri nets --- namely, the so-called NR/T-nets (Nested-Relation\slash Transition Nets). In NR/T-nets, the structural part is modeled by nested relations, and the behavioral part is modeled by a novel Petri net formalism. Each place of a net represents a nested relation scheme, and the marking of each place is given as a nested relation of the respective type. Insert and delete operations in a nested relational database (NF2-database) are expressed by transitions in a net. These operations may operate not only on whole tuples of a given relation, but also on `subtuples' of existing tuples. The arcs of a net are inscribed with so-called Filter Tables, which allow (together with an optional logical expression as transition inscription) conditions to be formulated on the specified (sub-) tuples. The occurrence rule for NR/T-net transitions is defined by the operations union, intersection, and `negative' in lattices of nested relations. The structure of an NR/T-net, together with the occurrence rule, defines classes of possible information system procedures, i.e., sequences of (possibly concurrent) operations in an information system.", acknowledgement = ack-nhfb, affiliation = "Universitaet Karlsruhe", affiliationaddress = "Karlsruhe, Ger", classification = "721.2; 723.1.1; 723.3; 723.5; 903.3; 921.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Behavior specification; Complex objects; Computer aided logic design; Computer hardware description languages; Conceptual design; Data manipulation languages; Data structures; Information retrieval systems; Nested relations; Petri nets; Query languages; Transition nets", } @Article{Cheung:1996:MAG, author = "Waiman Cheung and Cheng Hsu", title = "The Model-Assisted Global Query System for Multiple Databases in Distributed Enterprises", journal = j-TOIS, volume = "14", number = "4", pages = "421--470", month = oct, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/cheung.html", abstract = "Today's enterprises typically employ multiple information systems, which are independently developed, locally administered, and different in logical or physical designs. Therefore, a fundamental challenge in enterprise information management is the sharing of information for enterprise users across organizational boundaries; this requires a global query system capable of providing on-line intelligent assistance to users. Conventional technologies, such as schema-based query languages and hard-coded schema integration, are not sufficient to solve this problem. This article develops a new approach, a `model-assisted global query system,' that utilizes an on-line repository of enterprise metadata --- the Metadatabase --- to facilitate global query formulation and processing with certain desirable properties such as adaptiveness and open-systems architecture. A definitional model characterizing the various classes and roles of the required metadata as knowledge for the system is presented. The significance of possessing this knowledge (via a Metadatabase) toward improving the global query capabilities available previously is analyzed. On this basis, a direct method using model traversal and a query language using global model constructs are developed along with other new methods required for this approach. It is then tested through a prototype system in a computer-integrated manufacturing (CIM) settings.", acknowledgement = ack-nhfb, affiliation = "Chinese Univ of Hong Kong", affiliationaddress = "Shatin, Hong Kong", classification = "721.2; 722.2; 722.4; 723.1.1; 723.3; 921", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data storage equipment; Distributed database systems; Enterprise information management; Global query system; Hard coded schema integration; Information retrieval; Logic design; Mathematical models; Metadatabases; Model traversal; Multiple information systems; Online intelligent assistance; Online systems; Query languages; User interfaces", wwwtitle = "The Model-Assisted Global Query System for Multiple Databases in Distributed Enterprise", } @Article{Anonymous:1996:AI, author = "Anonymous", title = "1996 Author Index", journal = j-TOIS, volume = "14", number = "4", pages = "471--472", month = oct, year = "1996", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 16:21:56 MST 1999", bibsource = "http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/cheung.html", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wiil:1997:HHS, author = "Uffe K. Wiil and John J. Leggett", title = "{Hyperform}: a Hypermedia System Development Environment", journal = j-TOIS, volume = "15", number = "1", pages = "1--31", month = jan, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/wiil.html", abstract = "Development of hypermedia systems is a complex matter. The current trend toward open, extensible, and distributed multiuser hypermedia systems adds additional complexity to the development process. As a means of reducing this complexity, there has been an increasing interest in hyperbase management systems that allow hypermedia system developers to abstract from the intricacies and complexity of the hyperbase layer and fully attend to application and user interface issues. Design, development, and deployment experiences of a dynamic, open, and distributed multiuser hypermedia system development environment called Hyperform is presented. Hyperform is based on the concepts of extensibility, tailorability, and rapid prototyping of hypermedia system services. Open, extensible hyperbase management systems permit hypermedia system developers to tailor hypermedia functionality for specific applications and to serve as a platform for research. The Hyperform development environment is comprised of multiple instances of four component types: (1) a hyperbase management system server, (2) a tool integrator, (3) editors, and (4) participating tools. Hyperform has been deployed in Unix environments, and experiments have shown that Hyperform greatly reduces the effort required to provide customized hyperbase management system support for distributed multiuser hypermedia systems.", acknowledgement = ack-nhfb, affiliation = "Aalborg Univ", affiliationaddress = "Den", classification = "722.4; 723.1; 723.2; 723.3; 723.5; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Advanced hypermedia system architecture; Computational complexity; Computer architecture; Data structures; Database systems; Extensible hyperbase management system; Hyperform; Information retrieval systems; Object oriented extension language; Object oriented programming; Rapid prototyping; System theory", } @Article{Fuhr:1997:PRA, author = "Norbert Fuhr and Thomas R{\"o}lleke", title = "A Probabilistic Relational Algebra for the Integration of Information Retrieval and Database Systems", journal = j-TOIS, volume = "15", number = "1", pages = "32--66", month = jan, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/fuhr.html", abstract = "We present a probabilistic relational algebra (PRA) which is a generalization of standard relational algebra. In PRA, tuples are assigned probabilistic weights giving the probability that a tuple belongs to a relation. Based on intensional semantics, the tuple weights of the result of a PRA expression always conform to the underlying probabilistic model. We also show for which expressions extensional semantics yields the same results. Furthermore, we discuss complexity issues and indicate possibilities for optimization. With regard to databases, the approach allows for representing imprecise attribute values, whereas for information retrieval, probabilistic document indexing and probabilistic search term weighting can be modeled. We introduce the concept of vague predicates which yield probabilistic weights instead of Boolean values, thus allowing for queries with vague selection conditions. With these features, PRA implements uncertainty and vagueness in combination with the relational model.", acknowledgement = ack-nhfb, affiliation = "Univ of Dortmund", affiliationaddress = "Ger", classification = "721.1; 723.2; 723.3; 903.3; 921.5; 922.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computational complexity; Computational linguistics; Computer simulation; Data structures; Hypertext retrieval; Imprecise data; Indexing (of information); Information retrieval; Logical retrieval model; Optimization; Probabilistic relational algebra; Probabilistic retrieval; Probability; Query languages; Relational data model; Relational database systems; Uncertain data; Vague predicates", wwwauthor = "N. Fuhr and T. Rolleke", } @Article{Rus:1997:CIC, author = "Daniela Rus and Devika Subramanian", title = "Customizing Information Capture and Access", journal = j-TOIS, volume = "15", number = "1", pages = "67--101", month = jan, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/rus.html", abstract = "This article presents a customizable architecture for software agents that capture and access information in large, heterogeneous, distributed electronic repositories. The key idea is to exploit underlying structure at various levels of granularity to build high-level indices with task-specific interpretations. Information agents construct such indices and are configured as a network of reusable modules called structure detectors and segmenters. We illustrate our architecture with the design and implementation of smart information filters in two contexts: retrieving stock market data from Internet newsgroups and retrieving technical reports from Internet FTP sites.", acknowledgement = ack-nhfb, affiliation = "Dartmouth Coll", affiliationaddress = "NH, USA", classification = "716.1; 722.3; 722.4; 723.1; 723.2; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer architecture; Computer networks; Computer software; Data acquisition; Information gathering; Information retrieval systems; Information theory; Software agents; Table recognition", } @Article{Entlich:1997:MDL, author = "Richard Entlich and Lorrin Garson and Michael Lesk and Lorraine Normore and Jan Olsen and Stuart Weibel", title = "Making a Digital Library: The Contents of the {CORE} Project", journal = j-TOIS, volume = "15", number = "2", pages = "103--123", month = apr, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/entlich.html", abstract = "The CORE (Chemical Online Retrieval Experiment) project is a library of primary journal articles in chemistry. Any library has an inside and an outside; in this article we describe the inside of the library and the methods for building the system and accumulating the database. A later article will describe the outside (user experiences). Among electronic-library projects, the CORE project is unusual in that it has both ASCII derived from typesetting and image data for all its pages, and among experimental electronic-library projects, it is unusually large. We describe here (a) the processes of scanning and analyzing about 400,000 pages of primary journal material, (b) the conversion of a similar amount of textual database material, (c) the linking of these two data sources, and (d) the indexing of the text material.", acknowledgement = ack-nhfb, affiliation = "Cornell Univ", affiliationaddress = "NY, USA", classification = "722.2; 723.3; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Chemical online retrieval experiment (core) project; Database systems; Indexing (of information); Information retrieval systems; User interfaces", } @Article{Manber:1997:TCS, author = "Udi Manber", title = "A Text Compression Scheme That Allows Fast Searching Directly in the Compressed File", journal = j-TOIS, volume = "15", number = "2", pages = "124--136", month = apr, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/manber.html", abstract = "A new text compression scheme is presented in this article. The main purpose of this scheme is to speed up string matching by searching the compressed file directly. The scheme requires no modification of the string-matching algorithm, which is used as a black box; any string-matching procedure can be used. Instead, the pattern is modified; only the outcome of the matching of the modified pattern against the compressed file is decompressed. Since the compressed file is smaller than the original file, the search is faster both in terms of I/O time and processing time than a search in the original file. For typical text files, we achieve about 30\% reduction of space and slightly less of search time. A 30\% space saving is not competitive with good text compression schemes, and thus should not be used where space is the predominant concern. The intended applications of this scheme are files that are searched often, such as catalogs, bibliographic files, and address books. Such files are typically not compressed, but with this scheme they can remain compressed indefinitely, saving space while allowing faster search at the same time. A particular application to an information retrieval system that we developed is also discussed.", acknowledgement = ack-nhfb, affiliation = "Univ of Arizona", affiliationaddress = "Tucson, AZ, USA", classification = "723; 723.2; 723.5; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Data compression; Information retrieval systems; Pattern recognition; String matching algorithms", } @Article{Dunlop:1997:EAN, author = "Mark D. Dunlop", title = "The Effect of Accessing Nonmatching Documents on Relevance Feedback", journal = j-TOIS, volume = "15", number = "2", pages = "137--153", month = apr, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/dunlop.html", abstract = "Traditional information retrieval (IR) systems only allow users access to documents that match their current query, and therefore, users can only give relevance feedback on matching documents (or those with a matching strength greater than a set threshold). This article shows that, in systems that allow access to nonmatching documents (e.g., hybrid hypertext and information retrieval systems), the strength of the effect of giving relevance feedback varies between matching and nonmatching documents. For positive feedback the results shown here are encouraging, as they can be justified by an intuitive view of the process. However, for negative feedback the results show behavior that cannot easily be justified and that varies greatly depending on the model of feedback used.", acknowledgement = ack-nhfb, affiliation = "Univ of Glasgow", affiliationaddress = "Glasgow, UK", classification = "731.1; 903.3; 921; 921.1; 922.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Feedback; Free text information retrieval; Information retrieval systems; Mathematical models; Probability; Vectors", } @Article{Gladney:1997:ACL, author = "H. M. Gladney", title = "Access Control for Large Collections", journal = j-TOIS, volume = "15", number = "2", pages = "154--194", month = apr, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/gladney.html", abstract = "Efforts to place vast information resources at the fingertips of each individual in large user populations must be balanced by commensurate attention to information protection. For centralized operational systems in controlled environments, external administrative controls may suffice. For distributed systems with less-structured tasks, more-diversified information, and a heterogeneous user set, the computing system must administer enterprise-chosen access control policies. One kind of resource is a digital library that emulates massive collections of paper and other physical media for clerical, engineering, and cultural applications. This article considers the security requirements for such libraries and proposes an access control method that mimics organizational practice by combining a subject tree with ad hoc role granting that controls privileges for many operations independently, that treats (all but one) privileged roles (e.g., auditor, security officer) like every other individual authorization, and that binds access control information to objects indirectly for scaling, flexibility, and reflexive protection. We sketch a realization and show that it will perform well, generalizes many deployed proposed access control policies, and permits individual data centers to implement other models economically and without disruption.", acknowledgement = ack-nhfb, affiliation = "IBM Almaden Research Cent", affiliationaddress = "San Jose, CA, USA", classification = "722.4; 723.2; 723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Access control; Digital library; Distributed computer systems; Distributed database systems; Information retrieval systems; Security of data", } @Article{Dreilinger:1997:ESS, author = "Daniel Dreilinger and Adele E. Howe", title = "Experiences with Selecting Search Engines Using Metasearch", journal = j-TOIS, volume = "15", number = "3", pages = "195--222", month = jul, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/dreilinger.html", abstract = "Search engines are among the most useful and high-profile resources on the Internet. The problem of finding information on the Internet has been replaced with the problem of knowing where search engines are, what they are designed to retrieve, and how to use them. This article describes and evaluates SavvySearch, a metasearch engine designed to intelligently select and interface with multiple remote search engines. The primary metasearch issue examined is the importance of carefully selecting and ranking remote search engines for user queries. We studied the efficacy of SavvySearch's incrementally acquired metaindex approach to selecting search engines by analyzing the effect of time and experience on performance. We also compared the metaindex approach to the simpler categorical approach and showed how much experience is required to surpass the simple scheme.", acknowledgement = ack-nhfb, affiliation = "MIT Media Lab", affiliationaddress = "Cambridge, MA, USA", classification = "722.2; 722.3; 723.3; 723.4; 723.4.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Inference engines; Information retrieval systems; Interfaces (computer); Internet; Learning algorithms; Learning systems; Query languages; Search engines; Software package SavvySearch; Wide area networks", } @Article{Tomasic:1997:DSE, author = "Anthony Tomasic and Luis Gravano and Calvin Lue and Peter Schwarz and Laura Haas", title = "Data Structures for Efficient Broker Implementation", journal = j-TOIS, volume = "15", number = "3", pages = "223--253", month = jul, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/tomasic.html", abstract = "With the profusion of text databases on the Internet, it is becoming increasingly hard to find the most useful databases for a given query. To attack this problem, several existing and proposed systems employ brokers to direct user queries, using a local database of summary information about the available databases. This summary information must effectively distinguish relevant databases and must be compact while allowing efficient access. We offer evidence that one broker, GlOSS, can be effective at locating databases of interest even in a system of hundreds of databases and can examine the performance of accessing the GlOSS summaries for two promising storage methods: the grid file and partitioned hashing. We show that both methods can be tuned to provide good performance for a particular workload (within a broad range of workloads), and we discuss the tradeoffs between the two data structures. As a side effect of our work, we show that grid files are more broadly applicable than previously thought; in particular, we show that by varying the policies used to construct the grid file we can provide good performance for a wide range of workloads even when storing highly skewed data.", acknowledgement = ack-nhfb, affiliation = "INRIA Rocquencourt", affiliationaddress = "Le Chesnay, Fr", classification = "722.1; 722.2; 723.2; 723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Data storage equipment; Data structures; Distributed database systems; Grid files; Information retrieval; Internet; Partitioned hashing; Query languages; Text databases; User interfaces", } @Article{Bookstein:1997:MWO, author = "A. Bookstein and S. T. Klein and T. Raita", title = "Modeling Word Occurrences for the Compression of Concordances", journal = j-TOIS, volume = "15", number = "3", pages = "254--290", month = jul, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/bookstein.html", abstract = "An earlier paper developed a procedure for compressing concordances, assuming that all elements occurred independently. The models introduced in that paper are extended here to take the possibility of clustering into account. The concordance is conceptualized as a set of bitmaps, in which the bit locations represent documents, and the one-bits represent the occurrence of given terms. Hidden Markov Models (HMMs) are used to describe the clustering of the one-bits. However, for computational reasons, the HMM is approximated by traditional Markov models. A set of criteria is developed to constrain the allowable set of n-state models, and a full inventory is given for n less than or equal 4. Graph-theoretic reduction and complementation operations are defined among the various models and are used to provide a structure relating the models studied. Finally, the new methods were tested on the concordances of the English Bible and of two of the world's largest full-text retrieval system: the Tr{\'e}sor de la Langue Fran{\c{c}}aise and the Responsa Project.", acknowledgement = ack-nhfb, affiliation = "Univ of Chicago", affiliationaddress = "Chicago, IL, USA", classification = "723.2; 903.3; 921; 921.4; 921.6; 922.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Approximation theory; Classification (of information); Computational methods; Data compression; Data storage equipment; Data structures; Full text retrieval systems; Graph theory; Hidden Markov models (HMM); Information retrieval systems; Markov processes; Mathematical models", wwwpages = "254--291", } @Article{Cohen:1997:RHF, author = "Jonathan D. Cohen", title = "Recursive Hashing Functions for $n$-Grams", journal = j-TOIS, volume = "15", number = "3", pages = "291--320", month = jul, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; http://www.acm.org/pubs/tois/toc.html; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/tois/abstracts/cohen.html", abstract = "Many indexing, retrieval, and comparison methods are based on counting or cataloguing n-grams in streams of symbols. The fastest method of implementing such operations is through the use of hash tables. Rapid hashing of consecutive n-grams is best done using a recursive hash function, in which the hash value of the current n-gram is derived from the hash value of its predecessor. This article generalizes recursive hash functions found in the literature and proposes new methods offering superior performance. Experimental results demonstrate substantial speed improvement over conventional approaches, while retaining near-ideal hash value distribution.", acknowledgement = ack-nhfb, affiliation = "Natl Security Agency", affiliationaddress = "Fort Meade, MD, USA", classification = "721.1; 723.2; 903.1; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computational complexity; Data structures; Indexing (of information); Information retrieval; Recursive functions; Recursive hashing functions", } @Article{Kimbrough:1997:AMP, author = "Steven O. Kimbrough and Scott A. Moore", title = "On Automated Message Processing in Electronic Commerce and Work Support Systems: Speech Act Theory and Expressive Felicity", journal = j-TOIS, volume = "15", number = "4", pages = "321--367", month = oct, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Electronic messaging, whether in an office environment or for electronic commerce, is normally carried out in natural language, even when supported by information systems. For a variety of reasons, it would be useful if electronic messaging systems could have semantic access to, that is, access to the meanings and contents of, the messages they process. Given that natural language understanding is not a practicable alternative, there remain three approaches to delivering systems with semantic access: electronic data interchange (EDI), tagged messages, and the development of a formal language for business communication (FLBC). We favor the latter approach. In this article we compare and contrast these three approaches, present a theoretical basis for an FLBC (using speech act theory), and describe a prototype implementation.", acknowledgement = ack-nhfb, affiliation = "Univ of Pennsylvania", affiliationaddress = "Philadelphia, PA, USA", classification = "721.1; 722.3; 723.1; 723.4; 751.5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Data communication systems; Electronic commerce; Formal language for business communication; Formal languages; Knowledge representation; Software prototyping; Speech act theory; Speech processing", } @Article{Mostafa:1997:MAI, author = "J. Mostafa and S. Mukhopadhyay and W. Lam and M. Palakal", title = "A Multilevel Approach to Intelligent Information Filtering: Model, System, and Evaluation", journal = j-TOIS, volume = "15", number = "4", pages = "368--399", month = oct, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In information-filtering environments, uncertainties associated with changing interests of the user and the dynamic document stream must be handled efficiently. In this article, a filtering model is proposed that decomposes the overall task into subsystem functionalities and highlights the need for multiple adaptation techniques to cope with uncertainties. A filtering system, SIFTER, has been implemented based on the model, using established techniques in information retrieval and artificial intelligence. These techniques include document representation by a vector-space model, document classification by unsupervised learning, and user modeling by reinforcement learning. The system can filter information based on content and a user's specific interests. The user's interests are automatically learned with only limited user intervention in the form of optional relevance feedback for documents. We also describe experimental studies conducted with SIFTER to filter computer and information science documents collected from the Internet and commercial database services. The experimental results demonstrate that the system performs very well in filtering documents in a realistic problem setting.", acknowledgement = ack-nhfb, affiliation = "Indiana Univ", affiliationaddress = "Bloomington, IN, USA", classification = "723.2; 723.3; 723.4; 723.5; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Artificial intelligence; Computer simulation; Data processing; Database systems; Information retrieval systems; Intelligent information filtering; Learning systems; Reinforcement learning; Unsupervised learning", } @Article{Navarro:1997:PNM, author = "Gonzalo Navarro and Ricardo {Baeza- Yates}", title = "Proximal Nodes: a Model to Query Document Databases by Content and Structure", journal = j-TOIS, volume = "15", number = "4", pages = "400--435", month = oct, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A model to query document databases by both their content and structure is presented. The goal is to obtain a query language that is expressive in practice while being efficiently implementable, features not present at the same time in previous work. The key ideas of the model are a set-oriented query language based on operations on nearby structure elements of one or more hierarchies, together with content and structural indexing and bottom-up evaluation. The model is evaluated in regard to expressiveness and efficiency, showing that it provides a good trade-off between both goals. Finally, it is shown how to include in the model other media different from text.", acknowledgement = ack-nhfb, affiliation = "Univ of Chile", affiliationaddress = "Santiago, Chile", classification = "461.4; 723.1; 723.1.1; 723.2; 723.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Computer programming languages; Data processing; Data structures; Hierarchical documents; Human engineering; Man machine systems; Performance; Query languages; Structured text; Text algebras", } @Article{Anonymous:1997:AI, author = "Anonymous", title = "1997 Author Index", journal = j-TOIS, volume = "15", number = "4", pages = "436--437", month = oct, year = "1997", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:02:45 MST 1999", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Stotts:1998:HAV, author = "P. David Stotts and Richard Furuta and Cyrano {Ruiz Cabarrus}", title = "Hyperdocuments as Automata: Verification of Trace-Based Browsing Properties by Model Checking", journal = j-TOIS, volume = "16", number = "1", pages = "1--30", month = jan, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present a view of hyperdocuments in which each document encodes its own browsing semantics in its links. This requires a mental shift in how a hyperdocument is thought of abstractly. Instead of treating the links of a document as defining a static directed graph, they are thought of as defining an abstract program, termed the links automaton of the document. A branching temporal logic notation, termed HTL*, is introduced for specifying properties a document should exhibit during browsing. An automated program verification technique called model checking is used to verify that browsing specifications in a subset of HTL* are met by the behavior defined in the links automaton. We illustrate the generality of these techniques by applying them first to several Trellis documents and then to a Hyperties document.", acknowledgement = ack-nhfb, affiliation = "Univ of North Carolina", affiliationaddress = "Chapel Hill, NC, USA", classification = "721.1; 723.2; 921.4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Automata theory; Browsing semantics; Computation theory; Encoding (symbols); Graph theory; Hyperdocuments; Hypermedia; Model checking", } @Article{Vujovic:1998:EAF, author = "N. Vujovic and D. Brzakovic", title = "Evaluation of an Algorithm for Finding a Match of a Distorted Texture Pattern in a Large Image Database", journal = j-TOIS, volume = "16", number = "1", pages = "31--60", month = jan, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Evaluation of an algorithm for finding a match for a random texture pattern in a large image database is presented. The algorithm was designed assuming that the random pattern may be subject to misregistration relative to its representation in the database and assuming that it may have missing parts. The potential applications involve authentication of legal documents, bank notes, or credit cards, where thin fibers are embedded randomly into the document medium during medium fabrication. The algorithm achieves image matching by a three-step hierarchical procedure, which starts by matching parts of fiber patterns while solving the misregistration problem and ends up by matching complete fiber patterns. Performance of the algorithm is studied both theoretically and experimentally. Theoretical analysis includes the study. of the probability that two documents have the same pattern, and the probability of the algorithm establishing a wrong match, as well as the algorithm's performance in terms of processing time. Experiments involving over 250,000 trials using databases of synthetic documents, containing up to 100,000 documents, were used to confirm theoretical predictions. In addition, experiments involving a database containing real images were conducted in order to confirm that the algorithm has potential in real applications.", acknowledgement = ack-nhfb, affiliation = "Lehigh Univ", affiliationaddress = "Bethlehem, PA, USA", classification = "723.3; 731.1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Database systems; Identification (control systems); Image database; Image matching; Image processing", } @Article{Xu:1998:CBS, author = "Jinxi Xu and W. Bruce Croft", title = "Corpus-Based Stemming Using Cooccurrence of Word Variants", journal = j-TOIS, volume = "16", number = "1", pages = "61--81", month = jan, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Stemming is used in many information retrieval (IR) systems to reduce variant word forms to common roots. It is one of the simplest applications of natural language processing to IR and is one of the most effective in terms of user acceptance and consistency, though small retrieval improvements. Current stemming techniques do not, however, reflect the language use in specific corpora, and this can lead to occasional serious retrieval failures. We propose a technique for using corpus-based word variant cooccurrence statistics to modify or create a stemmer. The experimental results generated using English newspaper and legal text and Spanish text demonstrate the viability of this technique and its advantages relative to conventional approaches that only employ morphological rules.", acknowledgement = ack-nhfb, affiliation = "Univ of Massachusetts", affiliationaddress = "Amherst, MA, USA", classification = "723.3; 903.3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Cooccurrence; Corpus analysis; Database systems; Failure analysis; Information retrieval; Stemming", } @Article{Romm:1998:EMC, author = "Celia T. Romm and Nava Pliskin", title = "Electronic Mail as a Coalition-Building Information Technology", journal = j-TOIS, volume = "16", number = "1", pages = "82--100", month = jan, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "One of the most intriguing lines of research within the literature on diffusion of information technologies (IT) is the study of the power and politics of this process. The major objective of this article is to build on the work of Kling and Markus on power and IT, by extending their perspective to email. To demonstrate how email can be used for political purposes within an organizational context, a case study is presented. The case study describes a series of events which took place in a university. In the case, email was used by a group of employees to stage a rebellion against the university president. The discussion demonstrates that email features make it amenable to a range of political uses. The article is concluded with a discussion of the implications from this case to email research and practice.", acknowledgement = ack-nhfb, affiliation = "Univ of Wollongong", affiliationaddress = "Wollongong, Aust", classification = "903; 903.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Coalition building information technology; Electronic mail; Information dissemination; Information science; Information technology", } @Article{Wilbur:1998:KMH, author = "W. John Wilbur", title = "The Knowledge in Multiple Human Relevance Judgments", journal = j-TOIS, volume = "16", number = "2", pages = "101--126", month = apr, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We show first that the pooling of multiple human judgments of relevance provides a predictor of relevance that is superior to that obtained from a single human's relevance judgments. A learning algorithm applied to a set of relevance judgments obtained from a single human would be expected to perform on new material at a level somewhat below that human. However, we examine two learning methods which when trained on the superior source of pooled human relevance judgments are able to perform at the level of a single human on new material. All performance comparisons are based on an independent human judge. Both algorithms function by producing term weights --- one by a log odds calculation and the other by producing a least-squares fit to human relevance ratings. Some characteristics of the algorithms are examined.", acknowledgement = ack-nhfb, affiliation = "Natl Cent for Biotechnology Information (NCBI)", affiliationaddress = "Bethesda, MD, USA", classification = "903; 903.3; 921.6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Information retrieval; Information technology; Inverse document frequency weights; Least squares approximations", } @Article{Hicks:1998:HVC, author = "David L. Hicks and John J. Leggett and Peter J. Nurnberg and John L. Schnase", title = "A Hypermedia Version Control Framework", journal = j-TOIS, volume = "16", number = "2", pages = "127--160", month = apr, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The areas of application of hypermedia technology, combined with the capabilities that hypermedia provides for manipulating structure, create an environment in which version control is very important. A hypermedia version control framework has been designed to specifically address the version control problem in open hypermedia environments. One of the primary distinctions of the framework is the partitioning of hypermedia version control functionality into intrinsic and application-specific categories. The version control framework has been used as a model for the design of version control services for a hyperbase management system that provides complete version support for both data and structural entities. In addition to serving as a version control model for open hypermedia environments, the framework offers a clarifying and unifying context in which to examine the issues of version control in hypermedia.", acknowledgement = ack-nhfb, affiliation = "Knowledge Systems", affiliationaddress = "Export, PA, USA", classification = "723.2; 723.3; 912.2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Computer operating systems; Database systems; Hipermedia; Hyperbase management systems; Management; Management information systems", } @Article{Belussi:1998:SSJ, author = "Alberto Belussi and Christos Faloutsos", title = "Self-Spatial Join Selectivity Estimation Using Fractal Concepts", journal = j-TOIS, volume = "16", number = "2", pages = "161--201", month = apr, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The problem of selectivity estimation for queries of nontraditional databases is still an open issue. In this article, we examine the problem of selectivity estimation for some types of spatial queries in databases containing real data. We have shown earlier [Faloutsos and Kamel 1994] that real point sets typically have a non-uniform distribution, violating consistently the uniformity and independence assumptions. Moreover, we demonstrated that the theory of fractals can help to describe real point sets. In this article we show how the concept of fractal dimension, i.e., (non-integer) dimension, can lead to the solution for the selectivity estimation problem in spatial databases. Among the infinite family of fractal dimensions, we consider here the Hausdorff fractal dimension D0 and the `Correlation' fractal dimension D2. Specifically, we show that (a) the average number of neighbors for a given point set follows a power law, with D2 as exponent, and (b) the average number of nonempty range queries follows a power law with E --- D0 as exponent (E is the dimension of the embedding space). We present the formulas to estimate the selectivity for `biased' range queries, for self-spatial joins, and for the average number of nonempty range queries. The result of some experiments on real and synthetic point sets are shown. Our formulas achieve very low relative errors, typically about 10\%, versus 40\%-100\% of the formulas that are based on the uniformity and independence assumptions.", acknowledgement = ack-nhfb, affiliation = "Politecnico di Milano", affiliationaddress = "Milan, Italy", classification = "722; 723.3; 921", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", journalabr = "ACM Trans Inf Syst", keywords = "Algorithms; Computer selection and evaluation; Database systems; Fractal dimension; Fractals; Selectivity estimation", } @Article{Ackerman:1998:AOM, author = "Mark S. Ackerman", title = "Augmenting Organizational Memory: a Field Study of {Answer Garden}", journal = j-TOIS, volume = "16", number = "3", pages = "203--224", month = jul, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-3/p203-ackerman/", abstract = "A growing concern for organizations and groups has been to augment their knowledge and expertise. One such augmentation is to provide an organizational memory, some record of the organization's knowledge. However, relatively little is known about how computer systems might enhance organizational, group, or community memory. This article presents Answer Garden, a system for growing organizational memory. The article describes the system and its underlying implementation. It then presents findings from a field study of Answer Garden. The article discusses the usage data and qualitative evaluations from the field study, and then draws a set of lessons for next-generation organizational memory systems.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "performance; reliability", subject = "{\bf H.5.3} Information Systems, INFORMATION INTERFACES AND PRESENTATION, Group and Organization Interfaces. {\bf C.2.4} Computer Systems Organization, COMPUTER-COMMUNICATION NETWORKS, Distributed Systems, Distributed applications. {\bf H.1.2} Information Systems, MODELS AND PRINCIPLES, User/Machine Systems. {\bf H.3.3} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Information Search and Retrieval. {\bf H.4.3} Information Systems, INFORMATION SYSTEMS APPLICATIONS, Communications Applications. {\bf H.5.2} Information Systems, INFORMATION INTERFACES AND PRESENTATION, User Interfaces. {\bf I.7.2} Computing Methodologies, DOCUMENT AND TEXT PROCESSING, Document Preparation, Hypertext/hypermedia. {\bf K.4.3} Computing Milieux, COMPUTERS AND SOCIETY, Organizational Impacts.", } @Article{Crestani:1998:SPK, author = "F. Crestani and C. J. {Van Rijsbergen}", title = "A Study of Probability Kinematics in Information Retrieval", journal = j-TOIS, volume = "16", number = "3", pages = "225--255", month = jul, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-3/p225-crestani/", abstract = "We analyze the kinematics of probabilistic term weights at retrieval time for different Information Retrieval models. We present four models based on different notions of probabilistic retrieval. Two of these models are based on classical probability theory and can be considered as prototypes of models long in use in Information Retrieval, like the Vector Space Model and the Probabilistic Model. The two other models are based on a logical technique of evaluating the probability of a conditional called imaging; one is a generalization of the other. We analyze the transfer of probabilities occurring in the term space at retrieval time for these four models, compare their retrieval performance using classical test collections, and discuss the results. We believe that our results provide useful suggestions on how to improve existing probabilistic models of Information Retrieval by taking into consideration term-term similarity.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "experimentation; performance; theory", subject = "{\bf H.3.3} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Information Search and Retrieval, Retrieval models. {\bf F.1.2} Theory of Computation, COMPUTATION BY ABSTRACT DEVICES, Modes of Computation, Probabilistic computation.", } @Article{Moffat:1998:ACR, author = "Alistair Moffat and Radford M. Neal and Ian H. Witten", title = "Arithmetic Coding Revisited", journal = j-TOIS, volume = "16", number = "3", pages = "256--294", month = jul, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-3/p256-moffat/", abstract = "Over the last decade, arithmetic coding has emerged as an important compression tool. It is now the method of choice for adaptive coding on multisymbol alphabets because of its speed, low storage requirements, and effectiveness of compression. This article describes a new implementation of arithmetic coding that incorporates several improvements over a widely used earlier version by Witten, Neal, and Cleary, which has become a {\em de facto\/} standard. These improvements include fewer multiplicative operations, greatly extended range of alphabet sizes and symbol probabilities, and the use of low-precision arithmetic, permitting implementation by fast shift/add operations. We also describe a modular structure that separates the coding, modeling, and probability estimation components of a compression system. To motivate the improved coder, we consider the needs of a word-based text compression program. We report a range of experimental results using this and other models. Complete source code is available.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "algorithms; performance", subject = "{\bf E.4} Data, CODING AND INFORMATION THEORY, Data compaction and compression. {\bf E.1} Data, DATA STRUCTURES.", } @Article{Egenhofer:1998:MDN, author = "Max J. Egenhofer and A. Rashid B. M. Shariff", title = "Metric details for natural-language spatial relations", journal = j-TOIS, volume = "16", number = "4", pages = "295--321", month = oct, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-4/p295-egenhofer/", abstract = "Spatial relations often are desired answers that a geographic information system (GIS) should generate in response to a user's query. Current GIS's provide only rudimentary support for processing and interpreting natural-language-like spatial relations, because their models and representations are primarily quantitative, while natural-language spatial relations are usually dominated by qualitative properties. Studies of the use of spatial relations in natural language showed that topology accounts for a significant portion of the geometric properties. This article develops a formal model that captures {\em metric details\/} for the description of natural-language spatial relations. The metric details are expressed as refinements of the categories identified by the 9-intersection, a model for topological spatial relations, and provide a more precise measure than does topology alone as to whether a geometric configuration matches with a spatial term or not. Similarly, these measures help in identifying the spatial term that describes a particular configuration. Two groups of metric details are derived: {\em splitting ratios\/} as the normalized values of lengths and areas of intersections; and {\em closeness measures\/} as the normalized distances between disjoint object parts. The resulting model of topological and metric properties was calibrated for 64 spatial terms in English, providing values for the best fit as well as value ranges for the significant parameters of each term. Three examples demonstrate how the framework and its calibrated values are used to determine the best spatial term for a relationship between two geometric objects.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "design; human factors", subject = "{\bf H.2.8} Information Systems, DATABASE MANAGEMENT, Database Applications, Spatial databases and GIS. {\bf H.2.3} Information Systems, DATABASE MANAGEMENT, Languages, Query languages. {\bf H.3.3} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Information Search and Retrieval, Query formulation. {\bf H.3.3} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Information Search and Retrieval, Search process. {\bf H.3.3} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Information Search and Retrieval, Selection process. {\bf I.2.1} Computing Methodologies, ARTIFICIAL INTELLIGENCE, Applications and Expert Systems, Cartography. {\bf I.2.7} Computing Methodologies, ARTIFICIAL INTELLIGENCE, Natural Language Processing, Language parsing and understanding. {\bf I.5.1} Computing Methodologies, PATTERN RECOGNITION, Models, Geometric.", } @Article{Kolda:1998:SMD, author = "Tamara G. Kolda and Dianne P. O'Leary", title = "A semidiscrete matrix decomposition for latent semantic indexing information retrieval", journal = j-TOIS, volume = "16", number = "4", pages = "322--346", month = oct, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-4/p322-kolda/", abstract = "The vast amount of textual information available today is useless unless it can be effectively and efficiently searched. The goal in information retrieval is to find documents that are relevant to a given user query. We can represent and document collection by a matrix whose $(i, j)$ entry is nonzero only if the $i$th term appears in the {\em j\/}th document; thus each document corresponds to a column vector. The query is also represented as a column vector whose $i$th term is nonzero only if the $i$th term appears in the query. We score each document for relevancy by taking its inner product with the query. The highest-scoring documents are considered the most relevant. Unfortunately, this method does not necessarily retrieve all relevant documents because it is based on literal term matching. Latent semantic indexing (LSI) replaces the document matrix with an approximation generated by the truncated singular-value decomposition (SVD). This method has been shown to overcome many difficulties associated with literal term matching. In this article we propose replacing the SVD with the semidiscrete decomposition (SDD). We will describe the SDD approximation, show how to compute it, and compare the SDD-based LSI method to the SVD-based LSI methods. We will show that SDD-based LSI does as well as SVD-based LSI in terms of document retrieval while requiring only one-twentieth the storage and one-half the time to compute each query. We will also show how to update the SDD approximation when documents are added or deleted from the document collection.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "algorithms; design; performance; theory", subject = "{\bf H.3.3} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Information Search and Retrieval. {\bf G.1.2} Mathematics of Computing, NUMERICAL ANALYSIS, Approximation. {\bf H.2.2} Information Systems, DATABASE MANAGEMENT, Physical Design.", } @Article{Ram:1998:CCS, author = "Sudha Ram and V. Ramesh", title = "Collaborative conceptual schema design: a process model and prototype system", journal = j-TOIS, volume = "16", number = "4", pages = "347--371", month = oct, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-4/p347-ram/", abstract = "Recent years have seen an increased interest in providing support for collaborative activities among groups of users participating in various information systems design tasks such as, requirements determination and process modeling. However, little attention has been paid to the collaborative conceptual database design process. In this article, we develop a model of the collaborative conceptual schema development process and describe the design and implementation of a graphical multiuser conceptual schema design tool that is based on the model. The system we describe allows a group of users to work collaboratively on the creation of database schemas in synchronous (same-time) mode (either in a face-to-face or distributed setting). Extensive modeling support is provided to assist users in creating semantically correct conceptual schemas. The system also provides users with several graphical facilities such as, a large drawing workspace with the ability to scroll or ``jump'' to any portion of this workspace, zooming capabilities, and the ability to move object(s) to any portion of the workspace. The unique component of the system, however, is its built-in support for collaborative schema design. The system supports a relaxed WYSIWIS environment, i.e., each user can control the graphical layout of the same set of schema objects. The system ensures that changes/additions made by any user are consistent. Any conflicts that may compromise to the integrity of the shared schema are flagged and resolved by the system. The results from a preliminary experiment suggest that the use of our system in a collaborative mode improved information sharing among users, minimized conflicts, and led to a more comprehensive schema definition.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "design; management", subject = "{\bf H.2.1} Information Systems, DATABASE MANAGEMENT, Logical Design, Schema and subschema. {\bf K.6.3} Computing Milieux, MANAGEMENT OF COMPUTING AND INFORMATION SYSTEMS, Software Management. {\bf H.5.3} Information Systems, INFORMATION INTERFACES AND PRESENTATION, Group and Organization Interfaces, Collaborative computing.", } @Article{Wang:1998:SHD, author = "Weigang Wang and Roy Rada", title = "Structured hypertext with domain semantics", journal = j-TOIS, volume = "16", number = "4", pages = "372--412", month = oct, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-4/p372-wang/", abstract = "One important facet of current hypertext research involves using knowledge-based techniques to develop and maintain document structures. A semantic net is one such technique. However, most semantic-net-based hypertext systems leave the linking consistency of the net to individual users. Users without guidance may accidentally introduce structural and relational inconsistencies in the semantic nets. The relational inconsistency hinders the creation of domain information models. The structural inconsistency leads to unstable documents, especially when a document is composed by computation with traversal algorithms. This work tackles to above problems by integrating logical structure and domain semantics into a semantic net. A semantic-net-based structured-hypertext model has been formalized. The model preserves structural and relational consistency after changes to the semantic net. The hypertext system (RICH) based on this model has been implemented and tested. The RICH system can define and enforce a set of rules to maintain to integrity of the semantic net and provide particular support for creating multihierarchies with the reuse of existing contents and structures. Users have found such flexible but enforceable semantics to be helpful.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "design; documentation; management", subject = "{\bf I.7.2} Computing Methodologies, DOCUMENT AND TEXT PROCESSING, Document Preparation, Hypertext/hypermedia. {\bf E.1} Data, DATA STRUCTURES, Graphs and networks. {\bf H.2.1} Information Systems, DATABASE MANAGEMENT, Logical Design, Data models. {\bf H.3.4} Information Systems, INFORMATION STORAGE AND RETRIEVAL, Systems and Software. {\bf H.5.0} Information Systems, INFORMATION INTERFACES AND PRESENTATION, General.", } @Article{Croft:1998:AI, author = "W. Bruce Croft", title = "Author Index", journal = j-TOIS, volume = "16", number = "4", pages = "413--414", month = oct, year = "1998", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Jul 26 16:33:55 MDT 1999", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org:80/pubs/citations/journals/tois/1998-16-4/p413-croft/", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", subject = "{\bf A.0} General Literature, GENERAL.", } @Article{Chang:1999:PRT, author = "Chen-Chuan K. Chang and H{\'e}ctor Garcia-Molina and Andreas Paepcke", title = "Predicate rewriting for translating {Boolean} queries in a heterogeneous information system", journal = j-TOIS, volume = "17", number = "1", pages = "1--39", month = jan, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-1/p1-chang/", abstract = "Searching over heterogeneous information sources is difficult in part because of the nonuniform query languages. Our approach is to allow users to compose Boolean queries in one rich front-end language. For each user query and target source, we transform the user query into a subsuming query that can be supported by the source but that may return extra documents. The results are then processed by a filter query to yield the correct final results. In this article we introduce the architecture and associated mechanism for query translation. In particular, we discuss techniques for rewriting predicates in Boolean queries into native subsuming forms, which is a basis of translating complex queries. In addition, we present experimental results for evaluating the cost of postfiltering. We also discuss the drawbacks of this approach and cases when it may not be effective. We have implemented prototype versions of these mechanisms and demonstrated them on heterogeneous Boolean systems.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Experimentation; Languages; Measurement", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Boolean queries; content-based retrieval; filtering; predicate rewriting; query subsumption; query translation", subject = "Information Systems --- Database Management --- Languages (H.2.3): {\bf Query languages}; Information Systems --- Database Management --- Heterogeneous Databases (H.2.5); Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}; Information Systems --- Information Storage and Retrieval --- Digital Libraries (H.3.7): {\bf Systems issues}", } @Article{Hawking:1999:MIS, author = "David Hawking and Paul Thistlewaite", title = "Methods for information server selection", journal = j-TOIS, volume = "17", number = "1", pages = "40--76", month = jan, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-1/p40-hawking/", abstract = "The problem of using a broker to select a subset of available information servers in order to achieve a good trade-off between document retrieval effectiveness and cost is addressed. Server selection methods which are capable of operating in the absence of global information, and where servers have no knowledge of brokers, are investigated. A novel method using Lightweight Probe queries (LWP method) is compared with several methods based on data from past query processing, while Random and Optimal server rankings serve as controls. Methods are evaluated, using TREC data and relevance judgments, by computing ratios, both empirical and ideal, of recall and early precision for the subset versus the complete set of available servers. Estimates are also made of the best-possible performance of each of the methods. LWP and Topic Similarity methods achieved best results, each being capable of retrieving about 60\% of the relevant documents for only one-third of the cost of querying all servers. Subject to the applicable cost model, the LWP method is likely to be preferred because it is suited to dynamic environments. The good results obtained with a simple automatic LWP implementation were replicated using different data and a larger set of query topics.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design; Experimentation; Performance", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "information servers; Lightweight Probe queries; network servers; server ranking; server selection; text retrieval", subject = "Computer Systems Organization --- Computer-Communication Networks --- Distributed Systems (C.2.4): {\bf Distributed databases}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Selection process}; Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4): {\bf Information networks}; Information Systems --- Information Storage and Retrieval --- Library Automation (H.3.6): {\bf Large text archives}", } @Article{Tan:1999:EIG, author = "Bernard C. Y. Tan and Kwok-kee Wei and Richard T. Watson", title = "The equalizing impact of a group support system on status differentials", journal = j-TOIS, volume = "17", number = "1", pages = "77--100", month = jan, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-1/p77-tan/", abstract = "This study investigates the impact of the electronic communication capability of a group support system (GSS) on status differentials in small groups. A laboratory experiment was used to answer the research questions. Three support levels were studied: manual, face-to-face GSS, and dispersed GSS. Two task types were examined: intellective and preference. Five dependent variables reflecting different aspects of status differentials were measured: status influence, sustained influence, residual disagreement, perceived influence, and decision confidence. The results show that manual groups had higher status influence, sustained influence, and decision confidence, but lower residual disagreement than face-to-face GSS and dispersed GSS groups. Preference task groups also produced higher status influence and sustained influence, but lower residual disagreement compared to intellective task groups. In addition, manual groups working on the preference task reported higher perceived influence than face-to-face GSS and dispersed GSS groups working on the same task. These findings suggest that when groups are engaged in activities for which status differentials are undesirable, a GSS can be used in both face-to-face and dispersed settings to dampen status differentials. Moreover, when a task amplifies status differentials, the use of a GSS tends to produce corresponding stronger dampening effects.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Management; Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "electronic communication; group support systems; status differentials; task type", subject = "Information Systems --- Information Systems Applications --- Communications Applications (H.4.3); Information Systems --- Information Interfaces and Presentation --- Group and Organization Interfaces (H.5.3); Computer Applications --- Social and Behavioral Sciences (J.4)", } @Article{Bertino:1999:FAM, author = "Elisa Bertino and Sushil Jajodia and Pierangela Samarati", title = "A flexible authorization mechanism for relational data management systems", journal = j-TOIS, volume = "17", number = "2", pages = "101--140", month = apr, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-2/p101-bertino/", abstract = "In this article, we present an authorization model that can be used to express a number of discretionary access control policies for relational data management systems. The model permits both positive and negative authorizations and supports exceptions at the same time. The model is flexible in that the users can specify, for each authorization they grant, whether the authorization can allow for exceptions or whether it must be strongly obeyed. It provides authorization management for groups with exceptions at any level of the group hierarchy, and temporary suspension of authorizations. The model supports ownership together with decentralized administration of authorizations. Administrative privileges can also be restricted so that owners retain control over their tables.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Security; Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "access control mechanism; access control policy; authorization; data management system; group management support; relational database", subject = "Software --- Operating Systems --- Security and Protection (D.4.6): {\bf Access controls}; Information Systems --- Database Management --- Database Administration (H.2.7): {\bf Security, integrity, and protection}; Information Systems --- Database Management --- General (H.2.0): {\bf Security, integrity, and protection**}", } @Article{Cohen:1999:CSL, author = "William W. Cohen and Yoram Singer", title = "Context-sensitive learning methods for text categorization", journal = j-TOIS, volume = "17", number = "2", pages = "141--173", month = apr, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-2/p141-cohen/", abstract = "Two recently implemented machine-learning algorithms, {\em RIPPER\/} and {\em sleeping-experts for phrases}, are evaluated on a number of large text categorization problems. These algorithms both construct classifiers that allow the ``context'' of a word {\em w\/} to affect how (or even whether) the presence or absence of {\em w\/} will contribute to a classification. However, RIPPER and sleeping-experts differ radically in many other respects: differences include different notions as to what constitutes a context, different ways of combining contexts to construct a classifier, different methods to search for a combination of contexts, and different criteria as to what contexts should be included in such a combination. In spite of these differences, both RIPPER and sleeping-experts perform extremely well across a wide variety of categorization problems, generally outperforming previously applied learning methods. We view this result as a confirmation of the usefulness of classifiers that represent contextual information.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Experimentation", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "context-sensitive models; mistake-driven algorithms; on-line learning; rule learning; text categorization", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3); Computing Methodologies --- Artificial Intelligence --- Learning (I.2.6): {\bf Concept learning}; Computing Methodologies --- Artificial Intelligence --- Learning (I.2.6): {\bf Parameter learning}; Computing Methodologies --- Pattern Recognition --- Applications (I.5.4): {\bf Text processing}; Computing Methodologies --- Artificial Intelligence --- Natural Language Processing (I.2.7): {\bf Text analysis}", } @Article{El-Kwae:1999:RFC, author = "Essam A. El-Kwae and Mansur R. Kabuka", title = "A robust framework for content-based retrieval by spatial similarity in image databases", journal = j-TOIS, volume = "17", number = "2", pages = "174--198", month = apr, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-2/p174-el-kwae/", abstract = "A framework for retrieving images by spatial similarity (FRISS) in image databases is presented. In this framework, a robust retrieval by spatial similarity (RSS) algorithm is defined as one that incorporates both directional and topological spatial constraints, retrieves similar images, and recognized images even after they undergo translation, scaling, rotation (both perfect and multiple), or any arbitrary combination of transformations. The FRISS framework is discussed and used as a base for comparing various existing RSS algorithms. Analysis shows that none of them satisfies all the FRISS specifications. An algorithm, {\em SIM dtc}, is then presented. {\em SIM dtc\/} introduces the concept of a {\em rotation correction angle\/} (RCA) to align objects in one image spatially closer to matching objects in another image for more accurate similarity assessment. Similarity between two images is a function of the number of common objects between them and the closeness of directional and topological spatial relationships between object pairs in both images. The {\em SIM dtc\/} retrieval is invariant under translation, scaling, and perfect rotation, and the algorithm is able to rank multiple rotation variants. The algorithm was tested using synthetic images and the TESSA image database. Analysis shows the robustness of the {\em SIM dtc\/} algorithm over current algorithms.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Design; Experimentation; Measurement", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "content-based retrieval; image databases; multimedia databases; query formulation; retrieval models; similarity retrieval; spatial similarity", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Retrieval models}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}", } @Article{Shipman:1999:IFH, author = "Frank M. Shipman and Raymond J. McCall", title = "Incremental formalization with the hyper-object substrate", journal = j-TOIS, volume = "17", number = "2", pages = "199--227", month = apr, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-2/p199-shipman/", abstract = "Computers require formally represented information to perform computations that support users; yet users who have needed such support have often proved to be unable or unwilling to formalize it. To address this problem, this article introduces an approach called incremental formalization, in which, first, users express information informally and then the system aids them in formalizing it. Incremental formalization requires a system architecture the (1) integrates formal and informal representations and (2) supports progressive formalization of information. The system should have both tools to capture naturally available informal information and techniques to suggest possible formalizations of this information. The hyper-object substrate (HOS) was developed to satisfy these requirements. HOS has been applied to a number of problem domains, including network design, archaeological site analysis, and neuroscience education. Users have been successful in adding informal information and then later formalizing it incrementally with the aid of the system. Our experience with HOS has reaffirmed the need for information spaces to evolve during use and has identified additional considerations in the design and instantiation of systems enabling and supporting incremental formalization", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design; Human Factors", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", subject = "Information Systems --- Information Interfaces and Presentation --- User Interfaces (H.5.2); Information Systems --- Information Interfaces and Presentation --- Hypertext/Hypermedia (H.5.4); Computing Methodologies --- Artificial Intelligence --- Knowledge Representation Formalisms and Methods (I.2.4)", } @Article{Fuhr:1999:DTA, author = "Norbert Fuhr", title = "A decision-theoretic approach to database selection in networked {IR}", journal = j-TOIS, volume = "17", number = "3", pages = "229--229", month = jul, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-3/p229-fuhr/", abstract = "In networked IR, a client submits a query to a broker, which is in contact with a large number of databases. In order to yield a maximum number of documents at minimum cost, the broker has to make estimates about the retrieval cost of each database, and then decide for each database whether or not to use it for the current query, and if, how many documents to retrieve from it. For this purpose, we develop a general decision-theoretic model and discuss different cost structures. Besides cost for retrieving relevant versus nonrelevant documents, we consider the following parameters for each database: expected retrieval quality, expected number of relevant documents in the database and cost factors for query processing and document delivery. For computing the overall optimum, a divide-and-conquer algorithm is given. If there are several brokers knowing different databases, a preselection of brokers can only be performed heuristically, but the computation of the optimum can be done similarly to the single-broker case. In addition, we derive a formula which estimates the number of relevant documents in a database based on dictionary information.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "networked retrieval; probabilistic retrieval; probability ranking principle; resource discovery", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Retrieval models}; Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4): {\bf Information networks}", } @Article{Gauch:1999:CAA, author = "Susan Gauch and Jianying Wang and Satya Mahesh Rachakonda", title = "A corpus analysis approach for automatic query expansion and its extension to multiple databases", journal = j-TOIS, volume = "17", number = "3", pages = "250--250", month = jul, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-3/p250-gauch/", abstract = "Searching online text collections can be both rewarding and frustrating. While valuable information can be found, typically many irrelevant documents are also retrieved, while many relevant ones are missed. Terminology mismatches between the user's query and document contents are a main cause of retrieval failures. Expanding a user's query with related words can improve search performances, but finding and using related words is an open problem. This research uses corpus analysis techniques to automatically discover similar words directly from the contents of the databases which are not tagged with part-of-speech labels. Using these similarities, user queries are automatically expanded, resulting in conceptual retrieval rather than requiring exact word matches between queries and documents. We are able to achieve a 7.6\% improvement for TREC 5 queries and up to a 28.5\% improvement on the narrow-domain Cystic Fibrosis collection. This work has been extended to multidatabase collections where each subdatabase has a collection-specific similarity matrix associated with it. If the best matrix is selected, substantial search improvements are possible. Various techniques to select the appropriate matrix for a particular query are analyzed, and a 4.8\% improvement in the results is validated.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Experimentation", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "query expansion", subject = "Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Linguistic processing}; Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Thesauruses}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}", } @Article{Goh:1999:CIN, author = "Cheng Hian Goh and St{\'e}phane Bressan and Stuart Madnick and Michael Siegel", title = "Context interchange: new features and formalisms for the intelligent integration of information", journal = j-TOIS, volume = "17", number = "3", pages = "270--270", month = jul, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-3/p270-goh/", abstract = "The {\em Context Interchange strategy\/} presents a novel perspective for mediated data access in which semantic conflicts among heterogeneous systems are not identified a priori, but are detected and reconciled by a {\em context mediator\/} through comparison of {\em contexts axioms\/} corresponding to the systems engaged in data exchange. In this article, we show that queries formulated on shared views, export schema, and shared ``ontologies'' can be mediated in the same way using the {\em Context Interchange framework}. The proposed framework provides a logic-based object-oriented formalism for representing and reasoning about data semantics in disparate systems, and has been validated in a prototype implementation providing mediated data access to both traditional and web-based information sources.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "abductive reasoning; information integration; mediators; semantic heterogeneity; semantic interoperability", subject = "Information Systems --- Database Management --- Systems (H.2.4): {\bf Query processing}; Information Systems --- Database Management --- Heterogeneous Databases (H.2.5): {\bf Data translation**}; Information Systems --- Database Management --- Heterogeneous Databases (H.2.5)", } @Article{Lim:1999:HDQ, author = "Ee-Peng Lim and Ying Lu", title = "{Harp}: a distributed query system for legacy public libraries and structured databases", journal = j-TOIS, volume = "17", number = "3", pages = "294--294", month = jul, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-3/p294-lim/", abstract = "The main purpose of a digital library is to facilitate users easy access to enormous amount of globally networked information. Typically, this information includes preexisting public library catalog data, digitized document collections, and other databases. In this article, we describe the distributed query system of a digital library prototype system known as HARP. In the HARP project, we have designed and implemented a distributed query processor and its query front-end to support integrated queries to preexisting public library catalogs and structured databases. This article describes our experiences in the design of an extended Sequel (SQL) query language known as HarpSQL. It also presents the design and implementation of the distributed query system. Our experience in distributed query processor and user interface design and development will be highlighted. We believe that our prototyping effort will provide useful lessons to the development of a complete digital library infrastructure.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design; Languages", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "digital libraries; Internet databases; interoperable databases", subject = "Information Systems --- Information Storage and Retrieval (H.3); Information Systems --- Information Interfaces and Presentation --- User Interfaces (H.5.2): {\bf User interface management systems (UIMS)}", } @Article{Plaisant:1999:IDA, author = "Catherine Plaisant and Ben Shneiderman and Khoa Doan and Tom Bruns", title = "Interface and data architecture for query preview in networked information systems", journal = j-TOIS, volume = "17", number = "3", pages = "320--320", month = jul, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-3/p320-plaisant/", abstract = "There are numerous problems associated with formulating queries on networked information systems. These include increased data volume and complexity, accompanied by slow network access. This article proposes a new approach to a network query user interfaces that consists of two phases: query preview and query refinement. This new approach is based on the concepts of dynamic queries and query previews, which guides users in rapidly and dynamically eliminating undesired records, reducing the data volume to a manageable size, and refining queries locally before submission over a network. Examples of two applications are given: a Restaurant Finder and a prototype for NASA's Earth Observing Systems Data Information Systems (EOSDIS). Data architecture is discussed, and user feedback is presented.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design; Human Factors", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "direct manipulation; dynamic query; EOSDIS; graphical user interface; query preview; query refinement; science data", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}; Information Systems --- Information Interfaces and Presentation --- User Interfaces (H.5.2)", } @Article{Chen:1999:IGL, author = "Hao Chen and Jianying Hu and Richard W. Sproat", title = "Integrating geometrical and linguistic analysis for email signature block parsing", journal = j-TOIS, volume = "17", number = "4", pages = "343--366", month = oct, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/articles/journals/tois/1999-17-4/p343-chen/p343-chen.pdf; http://www.acm.org/pubs/citations/journals/tois/1999-17-4/p343-chen/", abstract = "The signature block is a common structured component found in email messages. Accurate identification and analysis of signature blocks is important in many multimedia messaging and information retrieval applications such as email text-to-speech rendering, automatic construction of personal address databases, and interactive message retrieval. It is also a very challenging task, because signature blocks often appear in complex two-dimensional layouts which are guided only by loose conventions. Traditional text analysis methods designed to deal with sequential text cannot handle two-dimensional structures, while the highly unconstrained nature of signature blocks makes the application of two-dimensional grammars very difficult. In this article, we describe an algorithm for signature block analysis which combines two-dimensional structural segmentation with one-dimensional grammatical constraints. The information obtained from both layout and linguistic analysis is integrated in the form of weighted finite-state transducers. The algorithm is currently implemented as a component in a preprocessing system for email text-to-speech rendering.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "email signature block; finite-state transducer; geometrical analysis; linguistic analysis; text-to-speech rendering", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Selection process}; Information Systems --- Information Systems Applications --- Communications Applications (H.4.3): {\bf Electronic mail}", } @Article{Greiff:1999:PMC, author = "Warren R. Greiff and W. Bruce Croft and Howard Turtle", title = "{PIC} matrices: a computationally tractable class of probabilistic query operators", journal = j-TOIS, volume = "17", number = "4", pages = "367--405", month = oct, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-4/p367-greiff/", abstract = "The inference network model of information retrieval allows a probabilistic interpretation of query operators. In particular, Boolean query operators are conveniently modeled as link matrices of the Bayesian Network. Prior work has shown, however, that these operators do not perform as well as the {\em pnorm\/} operators used for modeling query operators in the context of the vector space model. This motivates the search for alternative probabilistic formulations for these operators. The design of such alternatives must contend with the issue of computational tractability, since the evaluation of an arbitrary operator requires exponential time. We define a flexible class of link matrices that are natural candidates for the implementation of query operators and an $O(n^2)$ algorithm ($n$ = the number of parent nodes) for the computation of probabilities involving link matrices of this class. We present experimental results indicating that Boolean operators implemented in terms of link matrices from this class perform as well as {\em pnorm\/} operators in the context of the INQUERY inference network.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Performance; Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Bayesian networks; Boolean queries; computational complexity; inference networks; link matrices; piecewise linear functions; pnorm; probabilistic information retrieval; query operators", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}", } @Article{Kaszkiel:1999:EPR, author = "Marcin Kaszkiel and Justin Zobel and Ron Sacks-Davis", title = "Efficient passage ranking for document databases", journal = j-TOIS, volume = "17", number = "4", pages = "406--439", month = oct, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-4/p406-kaszkiel/", abstract = "Queries to text collections are resolved by ranking the documents in the collection and returning the highest-scoring documents to the user. An alternative retrieval method is to rank passages, that is, short fragments of documents, a strategy that can improve effectiveness and identify relevant material in documents that are too large for users to consider as a whole. However, ranking of passages can considerably increase retrieval costs. In this article we explore alternative query evaluation techniques, and develop new techniques for evaluating queries on passages. We show experimentally that, appropriately implemented, effective passage retrieval is practical in limited memory on a desktop machine. Compared to passage ranking with adaptations of current document ranking algorithms, our new ``DO-TOS'' passage-ranking algorithm requires only a fraction of the resources, at the cost of a small loss of effectiveness.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Performance", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "inverted files; passage retrieval; query evaluation; text databases; text retrieval", subject = "Data --- Files (E.5); Information Systems --- Database Management --- Physical Design (H.2.2); Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3)", } @Article{Sanderson:1999:IRE, author = "Mark Sanderson and C. J. {Van Rijsbergen}", title = "The impact on retrieval effectiveness of skewed frequency distributions", journal = j-TOIS, volume = "17", number = "4", pages = "440--465", month = oct, year = "1999", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/1999-17-4/p440-sanderson/", abstract = "We present an analysis of word senses that provides a fresh insight into the impact of word ambiguity on retrieval effectiveness with potential broader implications for other processes of information retrieval. Using a methodology of forming artificially ambiguous words, known as pseudowords, and through reference to other researchers' work, the analysis illustrates that the distribution of the frequency of occurrence of the senses of a word plays a strong role in ambiguity's impact of effectiveness. Further investigation shows that this analysis may also be applicable to other processes of retrieval, such as Cross Language Information Retrieval, query expansion, retrieval of OCR'ed texts, and stemming. The analysis appears to provide a means of explaining, at least in part, reasons for the processes' impact (or lack of it) on effectiveness.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Experimentation; Measurement", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "pseudowords; word sense ambiguity; word sense disambiguation", subject = "Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Linguistic processing}; Computing Methodologies --- Artificial Intelligence --- Natural Language Processing (I.2.7): {\bf Text analysis}; Computing Methodologies --- Simulation and Modeling --- Model Validation and Analysis (I.6.4); Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}", } @Article{Cahoon:2000:EPD, author = "Brendon Cahoon and Kathryn S. McKinley and Zhihong Lu", title = "Evaluating the performance of distributed architectures for information retrieval using a variety of workloads", journal = j-TOIS, volume = "18", number = "1", pages = "1--43", month = jan, year = "2000", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-1/p1-cahoon/", abstract = "The information explosion across the Internet and elsewhere offers access to an increasing number of document collections. In order for users to effectively access these collections, information retrieval (IR) systems must provide coordinated, concurrent, and distributed access. In this article, we explore how to achieve scalable performance in a distributed system for collection sizes ranging from 1GB to 128GB. We implement a fully functional distributed IR system based on a multithreaded version of the Inquery simulation model. We measure performance as a function of system parameters such as client command rate, number of document collections, ter ms per query, query term frequency, number of answers returned, and command mixture. Our results show that it is important to model both query and document commands because the heterogeneity of commands significantly impacts performance. Based on our results, we recommend simple changes to the prototype and evaluate the changes using the simulator. Because of the significant resource demands of information retrieval, it is not difficult to generate workloads that overwhelm system resources regardless of the architecture. However under some realistic workloads, we demonstrate system organizations for which response time gracefully degrades as the workload increases and performance scales with the number of processors. This scalable architecture includes a surprisingly small number of brokers through which a large number of clients and servers communicate.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "distributed information retrieval architectures", subject = "Computer Systems Organization --- Computer-Communication Networks --- Distributed Systems (C.2.4); Computer Systems Organization --- Performance of Systems (C.4); Computer Systems Organization --- Performance of Systems (C.4): {\bf Performance attributes}; Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4)", } @Article{Clarke:2000:SSR, author = "Charles L. A. Clarke and Gordon V. Cormack", title = "Shortest-substring retrieval and ranking", journal = j-TOIS, volume = "18", number = "1", pages = "44--78", month = jan, year = "2000", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-1/p44-clarke/", abstract = "We present a model for arbitrary passage retrieval using Boolean queries. The model is applied to the task of ranking documents, or other structural elements, in the order of their expected relevance. Features such as phrase matching, truncation, and stemming integrate naturally into the model. Properties of Boolean algebra are obeyed, and the exact-match semantics of Boolean retrieval are preserved. Simple inverted-list file structures provide an efficient implementation. Retrieval effectiveness is comparable to that of standard ranking techniques. Since global statistics are not used, the method is of particular value in distributed environments. Since ranking is based on arbitrary passages, the structural elements to be ranked may be specified at query time and do not need to be restricted to predefined elements.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Boolean retrieval model; passage retrieval; relevance ranking", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3); Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4); Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4): {\bf Performance evaluation (efficiency and effectiveness)}", } @Article{Xu:2000:IEI, author = "Jinxi Xu and W. Bruce Croft", title = "Improving the effectiveness of information retrieval with local context analysis", journal = j-TOIS, volume = "18", number = "1", pages = "79--112", month = jan, year = "2000", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-1/p79-xu/", abstract = "Techniques for automatic query expansion have been extensively studied in information research as a means of addressing the word mismatch between queries and documents. These techniques can be categorized as either global or local. While global techniques rely on analysis of a whole collection to discover word relationships, local techniques emphasize analysis of the top-ranked documents retrieved for a query. While local techniques have shown to be more effective that global techniques in general, existing local techniques are not robust and can seriously hurt retrieved when few of the retrieval documents are relevant. We propose a new technique, called {\em local context analysis,\/} which selects expansion terms based on cooccurrence with the query terms within the top-ranked documents. Experiments on a number of collections, both English and non-English, show that local context analysis offers more effective and consistent retrieval results.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "cooccurrence; document analysis; feedback; global techniques; information retrieval; local context analysis; local techniques", subject = "Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1); Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Indexing methods}; Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Thesauruses}; Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Linguistic processing}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3); Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Relevance feedback}", } @Article{SilvadeMoura:2000:FFW, author = "Edleno {Silva de Moura} and Gonzalo Navarro and Nivio Ziviani and Ricardo Baeza-Yates", title = "Fast and flexible word searching on compressed text", journal = j-TOIS, volume = "18", number = "2", pages = "113--139", month = apr, year = "2000", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-2/p113-silva_de_moura/", abstract = "We present a fast compression technique for natural language texts. The novelties are that (1) decompression of arbitrary portions of the text can be done very efficiently, (2) exact search for words and phrases can be done on the compressed text directly, using any known sequential pattern-matching algorithm, and (3) word-based approximate and extended search can also be done efficiently without any decoding. The compression scheme uses a semistatic word-based model and a Huffman code where the coding alphabet is byte-oriented rather than bit-oriented. We compress typical English texts to about 30\% of their original size, against 40\% and 35\% for {\em Compress\/} and {\em Gzip}, respectively. Compression time is close to that of {\em Compress\/} and approximately half of the time of {\em Gzip}, and decompression time is lower than that of {\em Gzip\/} and one third of that of {\em Compress}. We present three algorithms to search the compressed text. They allow a large number of variations over the basic word and phrase search capability, such as sets of characters, arbitrary regular expressions, and approximate matching. Separators and stopwords can be discarded at search time without significantly increasing the cost. When searching for simple words, the experiments show that running our algorithms on a compressed text is twice as fast as running the best existing software on the uncompressed version of the same text. When searching complex or approximate patterns, our algorithms are up to 8 times faster than the search on uncompressed text. We also discuss the impact of our technique in inverted files pointing to logical blocks and argue for the possibility of keeping the text compressed all the time, decompressing only for displaying purposes.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "compressed pattern matching; natural language text compression; word searching; word-based Huffman coding", subject = "Data --- Coding and Information Theory (E.4): {\bf Data compaction and compression}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}", } @Article{Dourish:2000:EDM, author = "Paul Dourish and W. Keith Edwards and Anthony LaMarca and John Lamping and Karin Petersen and Michael Salisbury and Douglas B. Terry and James Thornton", title = "Extending document management systems with user-specific active properties", journal = j-TOIS, volume = "18", number = "2", pages = "140--170", month = apr, year = "2000", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-2/p140-dourish/", abstract = "Document properties are a compelling infrastructure on which to develop document management applications. A property-based approach avoids many of the problems of traditional hierarchical storage mechanisms, reflects document organizations meaningful to user tasks, provides a means to integrate the perspectives of multiple individuals and groups, and does this all within a uniform interaction framework. Document properties can reflect not only categorizations of documents and document use, but also expressions of desired system activity, such as sharing criteria, replication management, and versioning. Augmenting property-based document management systems with active properties that carry executable code enables the provision of document-based services on a property infrastructure. The combination of document properties as a uniform mechanism for document management, and active properties as a way of delivering document services, represents a new paradigm for document management infrastructures. The Placeless Documents system is an experimental prototype developed to explore this new paradigm. It is based on the seamless integration of user-specific, active properties. We present the fundamental design approach, explore the challenges and opportunities it presents, and show our architectures deals with them.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "active properties; component software; document management systems; document services; user experience", subject = "Computer Systems Organization --- Computer-Communication Networks --- Distributed Systems (C.2.4): {\bf Distributed databases}; Software --- Operating Systems --- File Systems Management (D.4.3): {\bf Distributed file systems}; Data --- Files (E.5): {\bf Organization/structure}; Information Systems --- Information Storage and Retrieval --- Information Storage (H.3.2): {\bf File organization}; Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4): {\bf Distributed systems}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}", } @Article{El-Kwae:2000:ECB, author = "Essam A. El-Kwae and Mansur R. Kabuka", title = "Efficient content-based indexing of large image databases", journal = j-TOIS, volume = "18", number = "2", pages = "171--210", month = apr, year = "2000", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Sep 26 09:34:01 MDT 2000", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-2/p171-el-kwae/", abstract = "Large image databases have emerged in various applications in recent years. A prime requisite of these databases is the means by which their contents can be indexed and retrieved. A multilevel signature file called the Two Signature Multi-level Signature File ( {\em 2SMLSF\/} ) is introduced as an efficient access structure for large image databases. The {\em 2SMLSF\/} encodes image information into binary signatures and creates a tree structures can be efficiently searched to satisfy a user's query. Two types of signatures are generated. Type {\em I\/} signatures are used at all tree levels except the leaf level and are based only on the domain objects included in the image. Type {\em II\/} signatures, on the other hand, are stored at the leaf level and are based on the included domain objects and their spatial relationships. The {\em 2SMLSF\/} was compared analytically to existing signature file techniques. The {\em 2SMLSF\/} significantly reduces the storage requirements; the index structure can answer more queries; and the {\em 2SMLSF\/} performance significantly improves over current techniques. Both storage reduction and performance improvement increase with the number of objects per image and the number of images in the database. For an example large image database, a storage reduction of 78\% may be achieved while the performance improvement may reach 98\%.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "content analysis and indexing; document managing; image databases; index generation; multimedia databases", } @Article{Anderson:2000:CHH, author = "Kenneth M. Anderson and Richard N. Taylor and E. James Whitehead", title = "{Chimera}: hypermedia for heterogeneous software development enviroments", journal = j-TOIS, volume = "18", number = "3", pages = "211--245", year = "2000", bibdate = "Tue Apr 17 08:10:03 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-3/p211-anderson/", abstract = "Emerging software development environments are characterized by heterogeneity: they are composed of diverse object stores, user interfaces, and tools. This paper presents an approach for providing hypermedia services in this heterogeneous setting. Central notions of the approach include the following: anchors are established with respect to interactive {\em views\/} of objects, rather than the objects themselves; composable, $n$-ary links can be established between anchors on different views of objects which may be stored in distinct object bases; viewers may be implemented in different programming languages; and, hypermedia services are provided to multiple, concurrently active, viewers. The paper describes the approach, supporting architecture, and lessons learned. Related work in the areas of supporting heterogeneity and hypermedia data modeling is discussed. The system has been employed in a variety of contexts including research, development, and education.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "heterogeneous hypermedia; hypermedia system architectures; link servers; open hypermedia systems; software development environments", subject = "Information Systems --- Information Interfaces and Presentation --- Multimedia Information Systems (H.5.1); Software --- Software Engineering --- Design Tools and Techniques (D.2.2); Computing Methodologies --- Document and Text Processing --- Document Preparation (I.7.2): {\bf Hypertext/hypermedia}; Information Systems --- Information Interfaces and Presentation --- Hypertext/Hypermedia (H.5.4)", } @Article{Greiff:2000:MEA, author = "Warren R. Greiff and Jay M. Ponte", title = "The maximum entropy approach and probabilistic {IR} models", journal = j-TOIS, volume = "18", number = "3", pages = "246--287", year = "2000", bibdate = "Tue Apr 17 08:10:03 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-3/p246-greiff/", abstract = "This paper takes a fresh look at modeling approaches to information retrieval that have been the basis of much of the probabilistically motivated IR research over the last 20 years. We shall adopt a subjectivist Bayesian view of probabilities and argue that classical work on probabilistic retrieval is best understood from this perspective. The main focus of the paper will be the ranking formulas corresponding to the Binary Independence Model (BIM), presented originally by Roberston and Sparck John [1977] and the Combination Match Model (CMM), developed shortly thereafter by Croft and Harper [1979]. We will show how these same ranking formulas can result from a probabilistic methodology commonly known as Maximum Entropy (MAXENT).", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Retrieval models}", } @Article{Cohen:2000:DIU, author = "William W. Cohen", title = "Data integration using similarity joins and a word-based information representation language", journal = j-TOIS, volume = "18", number = "3", pages = "288--321", year = "2000", bibdate = "Tue Apr 17 08:10:03 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-3/p288-cohen/", abstract = "The integration of distributed, heterogeneous databases, such as those available on the World Wide Web, poses many problems. Herer we consider the problem of integrating data from sources that lack common object identifiers. A solution to this problem is proposed for databases that contain informal, natural-language ``names'' for objects; most Web-based databases satisfy this requirement, since they usually present their information to the end-user through a veneer of text. We describe WHIRL, a ``soft'' database management system which supports ``similarity joins,'' based on certain robust, general-purpose similarity metrics for text. This enables fragments of text (e.g., informal names of objects) to be used as keys. WHIRL includes textual objects as a built-in type, similarity reasoning as a built-in predicate, and answers every query with a list of answer substitutions that are ranked according to an overall score. Experiments show that WHIRL is much faster than naive inference methods, even for short queries, and efficient on typical queries to real-world databases with tens of thousands of tuples. Inferences made by WHIRL are also surprisingly accurate, equaling the accuracy of hand-coded normalization routines on one benchmark problem, and outperforming exact matching with a plausible global domain on a second.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Reliability", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", subject = "Information Systems --- Database Management --- Heterogeneous Databases (H.2.5); Information Systems --- Database Management --- Languages (H.2.3): {\bf Data manipulation languages (DML)}; Information Systems --- Database Management --- Languages (H.2.3): {\bf Query languages}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Retrieval models}", } @Article{Fraternali:2000:MDD, author = "Piero Fraternali and Paolo Paolini", title = "Model-driven development of {Web} applications: the {AutoWeb} system", journal = j-TOIS, volume = "18", number = "4", pages = "323--382", year = "2000", bibdate = "Tue Apr 17 08:10:03 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-4/p323-fraternali/", abstract = "This paper describes a methodology for the development of WWW applications and a tool environment specifically tailored for the methodology. The methodology and the development environment are based upon models and techniques already used in the hypermedia, information systems, and software engineering fields, adapted and blended in an original mix. The foundation of the proposal is the conceptual design of WWW applications, using HDM-lite, a notation for the specification of structure, navigation, and presentation semantics. The conceptual schema is then translated into a ``traditional'' database schema, which describes both the organization of the content and the desired navigation and presentation features. The WWW pages can therefore be dynamically generated from the database content, following the navigation requests of the user. A CASE environment, called AutoWeb System, offers a set of software tools, which assist the design and the execution of a WWW application, in all its different aspects, Real-life experiences of the use of the methodology and of the AutoWeb System in both the industrial and academic context are reported.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design; Experimentation; Human Factors", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "application; development; HTML; intranet; modeling; WWW", subject = "Information Systems --- Information Interfaces and Presentation --- Hypertext/Hypermedia (H.5.4); Software --- Software Engineering --- Design Tools and Techniques (D.2.2)", } @Article{Katzenstein:2000:BSO, author = "Gary Katzenstein and F. Javier Lerch", title = "Beneath the surface of organizational processes: a social representation framework for business process redesign", journal = j-TOIS, volume = "18", number = "4", pages = "383--422", year = "2000", bibdate = "Tue Apr 17 08:10:03 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/citations/journals/tois/2000-18-4/p383-katzenstein/", abstract = "This paper raises the question, ``What is an effective representation framework for organizational process design?'' By combining our knowledge of existing process models with data from a field study, the paper develops criteria for an effective process representation. Using these criteria and the case study, the paper integrates the process redesign and information system literatures to develop a representation framework that captures a process' social context. The paper argues that this social context framework, which represents people's motivations, social relationships, and social constraints, gives redesigners a richer sense of the process and allows process redesigners to simultaneously change social and logistic systems. The paper demonstrates the framework and some of its benefits and limitations.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Design; Performance", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "business process redesign; organizational change; process representation", subject = "Computing Milieux --- Computers and Society --- Organizational Impacts (K.4.3)", } @Article{Carpineto:2001:ITA, author = "Claudio Carpineto and Renato de Mori and Giovanni Romano and Brigitte Bigi", title = "An information-theoretic approach to automatic query expansion", journal = j-TOIS, volume = "19", number = "1", pages = "1--27", year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 17 08:17:10 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/articles/journals/tois/2001-19-1/p1-carpineto/p1-carpineto.pdf; http://www.acm.org/pubs/citations/journals/tois/2001-19-1/p1-carpineto/", abstract = "Techniques for automatic query expansion from top retrieved documents have shown promise for improving retrieval effectiveness on large collections; however, they often rely on an empirical ground, and there is a shortage of cross-system comparisons. Using ideas from Information Theory, we present a computationally simple and theoretically justified method for assigning scores to candidate expansion terms. Such scores are used to select and weight expansion terms within Rocchio's framework for query reweighting. We compare ranking with information-theoretic query expansion versus ranking with other query expansion techniques, showing that the former achieves better retrieval effectiveness on several performance measures. We also discuss the effect on retrieval effectiveness of the main parameters involved in automatic query expansion, such as data sparseness, query difficulty, number of selected documents, and number of selected terms, pointing out interesting relationships.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Design; Experimentation; Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "automatic query expansion; information retrieval; information theory; pseudorelevance feedback", subject = "Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Retrieval models}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Relevance feedback}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Query formulation}; Information Systems --- Information Storage and Retrieval --- Content Analysis and Indexing (H.3.1): {\bf Indexing methods}", } @Article{deOliveira:2001:SBM, author = "Maria Cristina Ferreira de Oliveira and Marcelo Augusto Santos Turine and Paulo Cesar Masiero", title = "A statechart-based model for hypermedia applications", journal = j-TOIS, volume = "19", number = "1", pages = "28--52", year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 17 08:17:10 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/articles/journals/tois/2001-19-1/p28-de_oliveira/p28-de_oliveira.pdf; http://www.acm.org/pubs/citations/journals/tois/2001-19-1/p28-de_oliveira/", abstract = "This paper presents a formal definition for HMBS (Hypermedia Model Based on Statecharts). HMBS uses the structure and execution semantics of statecharts to specify both the structural organization and the browsing semantics of hypermedia applications. Statecharts are an extension of finite-state machines and the model is thus a generalization of hypergraph-based hypertext models. Some of the most important features of HMBS are its ability to model hierarchy and synchronization of information; provision of mechanisms for specifying access structures, navigational contexts, access control, multiple tailored versions,and hierarchical views. Analysis of the underlying statechart machine allows verification of page reachability, valid paths, and other properties, thus providing mechanisms to support authors in the development of structured applications.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", generalterms = "Algorithms; Design; Languages; Theory", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "browsing semantics; HMBS; hypermedia specification; navigational model; statecharts", subject = "Theory of Computation --- Computation by Abstract Devices --- Models of Computation (F.1.1): {\bf Relations between models}; Computing Methodologies --- Document and Text Processing --- Document Preparation (I.7.2): {\bf Hypertext/hypermedia}; Information Systems --- Information Storage and Retrieval --- Information Search and Retrieval (H.3.3): {\bf Search process}; Information Systems --- Information Storage and Retrieval --- Systems and Software (H.3.4): {\bf Information networks}; Information Systems --- Information Interfaces and Presentation --- Multimedia Information Systems (H.5.1): {\bf Hypertext navigation and maps**}; Information Systems --- Information Interfaces and Presentation --- Hypertext/Hypermedia (H.5.4)", } @Article{Papadias:2001:AST, author = "Dimitris Papadias and Nikos Mamoulis and Vasilis Delis", title = "Approximate spatio-temporal retrieval", journal = j-TOIS, volume = "19", number = "1", pages = "53--96", year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 17 08:17:10 MDT 2001", bibsource = "http://www.acm.org/pubs/toc/; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "http://www.acm.org/pubs/articles/journals/tois/2001-19-1/p53-papadias/p53-papadias.pdf; http://www.acm.org/pubs/citations/journals/tois/2001-19-1/p53-papadias/", abstract = "This paper proposes a framework for the handling of spatio-temporal queries with inexact matches, using the concept of relation similarity. We initially describe a binary string encoding for 1D relations that permits the automatic derivation of similarity measures. We then extend this model to various granularity levels and many dimensions, and show that reasoning on spatio-temporal structure is significantly facilitated in the new framework. Finally, we provide algorithms and optimization methods for four types of queries: (i) object retrieval based on some spatio-temporal relations with respect to a reference object, (ii) spatial joins, i.e., retrieval of object pairs that satisfy some input relation, (iii) structural queries, which retrieve configurations matching a particular spatio-temporal structure, and (iv) special cases of motion queries. Considering the current large availability of multidimensional data and the increasing need for flexible query-answering mechanisms, our techniques can be used as the core of spatio-temporal query processors.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", subject = "Information Systems --- Database Management --- Physical Design (H.2.2): {\bf Access methods}; Information Systems --- Database Management --- Systems (H.2.4): {\bf Multimedia databases}; Information Systems --- Database Management --- Database Applications (H.2.8): {\bf Spatial databases and GIS}", } @Article{Callan:2001:QBS, author = "Jamie Callan and Margaret Connell", title = "Query-based sampling of text databases", journal = j-TOIS, volume = "19", number = "2", pages = "97--130", month = apr, year = "2001", CODEN = "ATISET", DOI = "https://doi.org/10.1145/382979.383040", ISSN = "1046-8188", bibdate = "Thu Oct 1 16:56:41 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The proliferation of searchable text databases on corporate networks and the Internet causes a database selection problem for many people. Algorithms such as gGLOSS and CORI can automatically select which text databases to search for a given information need, but only if given a set of resource descriptions that accurately represent the contents of each database. The existing techniques for a acquiring resource descriptions have significant limitations when used in wide-area networks controlled by many parties. This paper presents query-based sampling, a new technique for acquiring accurate resource descriptions. Query-based sampling does not require the cooperation of resource providers, nor does it require that resource providers use a particular search engine or representation technique. An extensive set of experimental results demonstrates that accurate resource descriptions are created, that computation and communication costs are reasonable, and that the resource descriptions do in fact enable accurate automatic database selection.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lempel:2001:SSA, author = "R. Lempel and S. Moran", title = "{SALSA}: the stochastic approach for link-structure analysis", journal = j-TOIS, volume = "19", number = "2", pages = "131--160", month = apr, year = "2001", CODEN = "ATISET", DOI = "https://doi.org/10.1145/382979.383041", ISSN = "1046-8188", bibdate = "Thu Oct 1 16:56:41 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Today, when searching for information on the WWW, one usually performs a query through a term-based search engine. These engines return, as the query's result, a list of Web pages whose contents matches the query. For broad-topic queries, such searches often result in a huge set of retrieved documents, many of which are irrelevant to the user. However, much information is contained in the link-structure of the WWW. Information such as which pages are linked to others can be used to augment search algorithms. In this context, Jon Kleinberg introduced the notion of two distinct types of Web pages: hubs and authorities. Kleinberg argued that hubs and authorities exhibit a mutually reinforcing relationship: a good hub will point to many authorities, and a good authority will be pointed at by many hubs. In light of this, he devised an algorithm aimed at finding authoritative pages. We present SALSA, a new stochastic approach for link-structure analysis, which examines random walks on graphs derived from the link-structure. We show that both SALSA and Kleinberg's Mutual Reinforcement approach employ the same metaalgorithm. We then prove that SALSA is equivalent to a weighted in degree analysis of the link-structure of WWW subgraphs, making it computationally more efficient than the Mutual reinforcement approach. We compare that results of applying SALSA to the results derived through Kleinberg's approach. These comparisons reveal a topological Phenomenon called the TKC effect which, in certain cases, prevents the Mutual reinforcement approach from identifying meaningful authorities.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Meuss:2001:CAA, author = "Holger Meuss and Klaus U. Schulz", title = "Complete answer aggregates for treelike databases: a novel approach to combine querying and navigation", journal = j-TOIS, volume = "19", number = "2", pages = "161--215", month = apr, year = "2001", CODEN = "ATISET", DOI = "https://doi.org/10.1145/382979.383042", ISSN = "1046-8188", bibdate = "Thu Oct 1 16:56:41 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The use of markup languages like SGML, HTML or XML for encoding the structure of documents or linguistic data has lead to many databases where entries are adequately described as trees. In this context querying formalisms are interesting that offer the possibility to refer both to textual content and logical structure. We consider models where the structure specified in a query is not only used as a filter, but also for selecting and presenting different parts of the data. If answers are formalized as mapping from query nodes to the database, a simple enumeration of all mappings in the answer set will often suffer from the effect that many answers have common subparts. From a theoretical point of view this may lead to an exponential time complexity of the computation and presentation of all answers. Concentration on the language of so called tree queries-a variant and extension of Kilpel{\"a}inen's Tree Matching formalism-we introduce the notion of a ``complete answer aggregate'' for a given query. This new data structure offers a compact view of the set of all answer and supports active exploration of the answer space. Since complete answer aggregates use a powerful structure-sharing mechanism their maximal size is of order $ O(d \cdot h \cdot q) $ where $d$ and $q$ respectively denote the size of the database and the query, and $h$ is the maximal depth of a path of the database. An algorithm is given that computes a complete answer aggregate for a given tree query in time $ O(d \cdot \log (d) \cdot h \cdot q)$. For the sublanguage of so-called rigid tree queries, as well as for so-called ``nonrecursive'' databases, an improved bound of $ O (d \cdot \log (d) \cdot q)$ is obtained. The algorithm is based on a specific index structure that supports practical efficiency.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Melnik:2001:BDF, author = "Sergey Melnik and Sriram Raghavan and Beverly Yang and Hector Garcia-Molina", title = "Building a distributed full-text index for the {Web}", journal = j-TOIS, volume = "19", number = "3", pages = "217--241", month = jul, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Kwok:2001:SQA, author = "Cody Kwok and Oren Etzioni and Daniel S. Weld", title = "Scaling question answering to the {Web}", journal = j-TOIS, volume = "19", number = "3", pages = "242--262", month = jul, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hong:2001:WPB, author = "Jason I. Hong and Jeffrey Heer and Sarah Waterson and James A. Landay", title = "{WebQuilt}: a proxy-based approach to remote web usability testing", journal = j-TOIS, volume = "19", number = "3", pages = "263--285", month = jul, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Aggarwal:2001:DLC, author = "Charu C. Aggarwal and Fatima Al-Garawi and Philip S. Yu", title = "On the design of a learning crawler for topical resource discovery", journal = j-TOIS, volume = "19", number = "3", pages = "286--309", month = jul, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Meng:2001:HSE, author = "Weiyi Meng and Zonghuan Wu and Clement Yu and Zhuogang Li", title = "A highly scalable and effective method for metasearch", journal = j-TOIS, volume = "19", number = "3", pages = "310--335", month = jul, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wong:2001:AAF, author = "Kam-Fai Wong and Dawei Song and Peter Bruza and Chun-Hung Cheng", title = "Application of aboutness to functional benchmarking in information retrieval", journal = j-TOIS, volume = "19", number = "4", pages = "337--370", month = oct, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Comai:2001:CGQ, author = "Sara Comai and Ernesto Damiani and Piero Fraternali", title = "Computing graphical queries over {XML} data", journal = j-TOIS, volume = "19", number = "4", pages = "371--430", month = oct, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yoshioka:2001:GTK, author = "Takeshi Yoshioka and George Herman and JoAnne Yates and Wanda Orlikowski", title = "Genre taxonomy: a knowledge repository of communicative actions", journal = j-TOIS, volume = "19", number = "4", pages = "431--456", month = oct, year = "2001", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Feb 19 14:45:47 MST 2002", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lempel:2002:PPA, author = "Ronny Lempel and Aya Soffer", title = "{PicASHOW}: {Pictorial} authority search by hyperlinks on the {Web}", journal = j-TOIS, volume = "20", number = "1", pages = "1--24", month = jan, year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Aridor:2002:KEF, author = "Yariv Aridor and David Carmel and Yoelle S. Maarek and Aya Soffer and Ronny Lempel", title = "Knowledge encapsulation for focused search from pervasive devices", journal = j-TOIS, volume = "20", number = "1", pages = "25--46", month = jan, year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bharat:2002:WEA, author = "Krishna Bharat and George A. Mihaila", title = "When experts agree: using non-affiliated experts to rank popular topics", journal = j-TOIS, volume = "20", number = "1", pages = "47--58", month = jan, year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wen:2002:QCU, author = "Ji-Rong Wen and Jian-Yun Nie and Hong-Jiang Zhang", title = "Query clustering using user logs", journal = j-TOIS, volume = "20", number = "1", pages = "59--81", month = jan, year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Buyukkokten:2002:EWB, author = "Orkut Buyukkokten and Oliver Kaljuvee and Hector Garcia-Molina and Andreas Paepcke and Terry Winograd", title = "Efficient {Web} browsing on handheld devices using page and form summarization", journal = j-TOIS, volume = "20", number = "1", pages = "82--115", month = jan, year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Finkelstein:2002:PSC, author = "Lev Finkelstein and Evgeniy Gabrilovich and Yossi Matias and Ehud Rivlin and Zach Solan and Gadi Wolfman and Eytan Ruppin", title = "Placing search in context: The concept revisited", journal = j-TOIS, volume = "20", number = "1", pages = "116--131", month = jan, year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cooper:2002:PPD, author = "Brian F. Cooper and Hector Garcia-Molina", title = "Peer-to-peer data trading to preserve information", journal = j-TOIS, volume = "20", number = "2", pages = "133--170", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chowdhury:2002:CSF, author = "Abdur Chowdhury and Ophir Frieder and David Grossman and Mary Catherine McCabe", title = "Collection statistics for fast duplicate document detection", journal = j-TOIS, volume = "20", number = "2", pages = "171--191", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Heinz:2002:BTF, author = "Steffen Heinz and Justin Zobel and Hugh E. Williams", title = "Burst tries: a fast, efficient data structure for string keys", journal = j-TOIS, volume = "20", number = "2", pages = "192--223", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhu:2002:TKB, author = "Lei Zhu and Aibing Rao and Aidong Zhang", title = "Theory of keyblock-based image retrieval", journal = j-TOIS, volume = "20", number = "2", pages = "224--257", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:11 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Carpineto:2002:IRF, author = "Claudio Carpineto and Giovanni Romano and Vittorio Giannini", title = "Improving retrieval feedback with multiple term-ranking function combination", journal = j-TOIS, volume = "20", number = "3", pages = "259--290", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:12 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Owei:2002:IAH, author = "Vesper Owei", title = "An intelligent approach to handling imperfect information in concept-based natural language queries", journal = j-TOIS, volume = "20", number = "3", pages = "291--328", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:12 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cannane:2002:GPC, author = "Adam Cannane and Hugh E. Williams", title = "A general-purpose compression scheme for large collections", journal = j-TOIS, volume = "20", number = "3", pages = "329--355", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:12 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Amati:2002:PMI, author = "Gianni Amati and Cornelis Joost {Van Rijsbergen}", title = "Probabilistic models of information retrieval based on measuring the divergence from randomness", journal = j-TOIS, volume = "20", number = "4", pages = "357--389", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:12 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Feng:2002:SNB, author = "Ling Feng and Elizabeth Chang and Tharam Dillon", title = "A semantic network-based design methodology for {XML} documents", journal = j-TOIS, volume = "20", number = "4", pages = "390--421", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:12 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Jarvelin:2002:CGB, author = "Kalervo J{\"a}rvelin and Jaana Kek{\"a}l{\"a}inen", title = "Cumulated gain-based evaluation of {IR} techniques", journal = j-TOIS, volume = "20", number = "4", pages = "422--446", year = "2002", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:12 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gravano:2003:QSA, author = "Luis Gravano and Panagiotis G. Ipeirotis and Mehran Sahami", title = "{QProber}: a system for automatic classification of hidden-{Web} databases", journal = j-TOIS, volume = "21", number = "1", pages = "1--41", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Calado:2003:LVG, author = "P{\'a}vel Calado and Berthier Ribeiro-Neto and Nivio Ziviani and Edleno Moura and Ilm{\'e}rio Silva", title = "Local versus global link information in the {Web}", journal = j-TOIS, volume = "21", number = "1", pages = "42--63", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ganesan:2003:EHD, author = "Prasanna Ganesan and Hector Garcia-Molina and Jennifer Widom", title = "Exploiting hierarchical domain structure to compute similarity", journal = j-TOIS, volume = "21", number = "1", pages = "64--93", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Conrad:2003:EUS, author = "Jack G. Conrad and Joanne R. S. Claussen", title = "Early user--system interaction for database selection in massive domain-specific online environments", journal = j-TOIS, volume = "21", number = "1", pages = "94--131", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Moldovan:2003:PIE, author = "Dan Moldovan and Marius Pa{\c{s}}ca and Sanda Harabagiu and Mihai Surdeanu", title = "Performance issues and error analysis in an open-domain question answering system", journal = j-TOIS, volume = "21", number = "2", pages = "133--154", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bertino:2003:HAC, author = "Elisa Bertino and Jianping Fan and Elena Ferrari and Mohand-Said Hacid and Ahmed K. Elmagarmid and Xingquan Zhu", title = "A hierarchical access control model for video database systems", journal = j-TOIS, volume = "21", number = "2", pages = "155--191", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Amato:2003:RPM, author = "Giuseppe Amato and Fausto Rabitti and Pasquale Savino and Pavel Zezula", title = "Region proximity in metric spaces and its use for approximate similarity search", journal = j-TOIS, volume = "21", number = "2", pages = "192--227", year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Aug 7 10:37:13 MDT 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Leroy:2003:UDC, author = "Gondy Leroy and Ann M. Lally and Hsinchun Chen", title = "The use of dynamic contexts to improve casual {Internet} searching", journal = j-TOIS, volume = "21", number = "3", pages = "229--253", month = jul, year = "2003", CODEN = "ATISET", DOI = "https://doi.org/10.1145/858476.858477", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:24:06 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Research has shown that most users' online information searches are suboptimal. Query optimization based on a relevance feedback or genetic algorithm using dynamic query contexts can help casual users search the Internet. These algorithms can draw on implicit user feedback based on the surrounding links and text in a search engine result set to expand user queries with a variable number of keywords in two manners. Positive expansion adds terms to a user's keywords with a Boolean ``and,'' negative expansion adds terms to the user's keywords with a Boolean ``not.'' Each algorithm was examined for three user groups, high, middle, and low achievers, who were classified according to their overall performance. The interactions of users with different levels of expertise with different expansion types or algorithms were evaluated. The genetic algorithm with negative expansion tripled recall and doubled precision for low achievers, but high achievers displayed an opposed trend and seemed to be hindered in this condition. The effect of other conditions was less substantial.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bolchini:2003:LPD, author = "Cristiana Bolchini and Fabio Salice and Fabio A. Schreiber and Letizia Tanca", title = "Logical and physical design issues for smart card databases", journal = j-TOIS, volume = "21", number = "3", pages = "254--285", month = jul, year = "2003", CODEN = "ATISET", DOI = "https://doi.org/10.1145/858476.858478", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:24:06 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The design of very small databases for smart cards and for portable embedded systems is deeply constrained by the peculiar features of the physical medium. We propose a joint approach to the logical and physical database design phases and evaluate several data structures with respect to the performance, power consumption, and endurance parameters of read/program operations on the Flash-EEPROM storage medium.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Upstill:2003:QIE, author = "Trystan Upstill and Nick Craswell and David Hawking", title = "Query-independent evidence in home page finding", journal = j-TOIS, volume = "21", number = "3", pages = "286--313", month = jul, year = "2003", CODEN = "ATISET", DOI = "https://doi.org/10.1145/858476.858479", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:24:06 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Hyperlink recommendation evidence, that is, evidence based on the structure of a web's link graph, is widely exploited by commercial Web search systems. However there is little published work to support its popularity. Another form of query-independent evidence, URL-type, has been shown to be beneficial on a home page finding task. We compared the usefulness of these types of evidence on the home page finding task, combined with both content and anchor text baselines. Our experiments made use of five query sets spanning three corpora---one enterprise crawl, and the WT10g and VLC2 Web test collections.We found that, in optimal conditions, all of the query-independent methods studied (in-degree, URL-type, and two variants of PageRank) offered a better than random improvement on a content-only baseline. However, only URL-type offered a better than random improvement on an anchor text baseline. In realistic settings, for either baseline, only URL-type offered consistent gains. In combination with URL-type the anchor text baseline was more useful for finding popular home pages, but URL-type with content was more useful for finding randomly selected home pages. We conclude that a general home page finding system should combine evidence from document content, anchor text, and URL-type classification.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Turney:2003:MPC, author = "Peter D. Turney and Michael L. Littman", title = "Measuring praise and criticism: {Inference} of semantic orientation from association", journal = j-TOIS, volume = "21", number = "4", pages = "315--346", month = oct, year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri Oct 31 06:13:42 MST 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chang:2003:MME, author = "Edward Chang and Beitao Li", title = "{MEGA}---the maximizing expected generalization algorithm for learning complex query concepts", journal = j-TOIS, volume = "21", number = "4", pages = "347--382", month = oct, year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri Oct 31 06:13:42 MST 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Eastman:2003:CRR, author = "Caroline M. Eastman and Bernard J. Jansen", title = "Coverage, relevance, and ranking: {The} impact of query operators on {Web} search engine results", journal = j-TOIS, volume = "21", number = "4", pages = "383--411", month = oct, year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri Oct 31 06:13:42 MST 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Powell:2003:CPC, author = "Allison L. Powell and James C. French", title = "Comparing the performance of collection selection algorithms", journal = j-TOIS, volume = "21", number = "4", pages = "412--456", month = oct, year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri Oct 31 06:13:42 MST 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Si:2003:SLM, author = "Luo Si and Jamie Callan", title = "A semisupervised learning method to merge search engine results", journal = j-TOIS, volume = "21", number = "4", pages = "457--491", month = oct, year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri Oct 31 06:13:42 MST 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Staff:2003:TR, author = "{ACM Transactions on Information Systems Staff}", title = "{TOIS} reviewers", journal = j-TOIS, volume = "21", number = "4", pages = "492--493", month = oct, year = "2003", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri Oct 31 06:13:42 MST 2003", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Konstan:2004:IRS, author = "Joseph A. Konstan", title = "Introduction to recommender systems: Algorithms and Evaluation", journal = j-TOIS, volume = "22", number = "1", pages = "1--4", month = jan, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sun Jan 11 10:24:10 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Herlocker:2004:ECF, author = "Jonathan L. Herlocker and Joseph A. Konstan and Loren G. Terveen and John T. Riedl", title = "Evaluating collaborative filtering recommender systems", journal = j-TOIS, volume = "22", number = "1", pages = "5--53", month = jan, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sun Jan 11 10:24:10 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Middleton:2004:OUP, author = "Stuart E. Middleton and Nigel R. Shadbolt and David C. De Roure", title = "Ontological user profiling in recommender systems", journal = j-TOIS, volume = "22", number = "1", pages = "54--88", month = jan, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sun Jan 11 10:24:10 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hofmann:2004:LSM, author = "Thomas Hofmann", title = "Latent semantic models for collaborative filtering", journal = j-TOIS, volume = "22", number = "1", pages = "89--115", month = jan, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sun Jan 11 10:24:10 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Huang:2004:AAR, author = "Zan Huang and Hsinchun Chen and Daniel Zeng", title = "Applying associative retrieval techniques to alleviate the sparsity problem in collaborative filtering", journal = j-TOIS, volume = "22", number = "1", pages = "116--142", month = jan, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sun Jan 11 10:24:10 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Deshpande:2004:IBT, author = "Mukund Deshpande and George Karypis", title = "Item-based top-{$N$} recommendation algorithms", journal = j-TOIS, volume = "22", number = "1", pages = "143--177", month = jan, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sun Jan 11 10:24:10 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhai:2004:SSM, author = "Chengxiang Zhai and John Lafferty", title = "A study of smoothing methods for language models applied to information retrieval", journal = j-TOIS, volume = "22", number = "2", pages = "179--214", month = apr, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Mana-Lopez:2004:MSA, author = "Manuel J. Ma{\~n}a-L{\'o}pez and Manuel {De Buenaga} and Jos{\'e} M. G{\'o}mez-Hidalgo", title = "Multidocument summarization: an added value to clustering in interactive retrieval", journal = j-TOIS, volume = "22", number = "2", pages = "215--241", month = apr, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lu:2004:ATM, author = "Wen-Hsiang Lu and Lee-Feng Chien and Hsi-Jian Lee", title = "Anchor text mining for translation of {Web} queries: {A} transitive translation approach", journal = j-TOIS, volume = "22", number = "2", pages = "242--269", month = apr, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Goncalves:2004:SSS, author = "Marcos Andr{\'e} Gon{\c{c}}alves and Edward A. Fox and Layne T. Watson and Neill A. Kipp", title = "Streams, structures, spaces, scenarios, societies (5s): a formal model for digital libraries", journal = j-TOIS, volume = "22", number = "2", pages = "270--312", month = apr, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fuhr:2004:XXQ, author = "Norbert Fuhr and Kai Gro{\ss}johann", title = "{XIRQL}: {An XML} query language based on information retrieval concepts", journal = j-TOIS, volume = "22", number = "2", pages = "313--356", month = apr, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bodoff:2004:RMH, author = "David Bodoff", title = "Relevance models to help estimate document and query parameters", journal = j-TOIS, volume = "22", number = "3", pages = "357--380", month = jul, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wu:2004:EMB, author = "Xindong Wu and Chengqi Zhang and Shichao Zhang", title = "Efficient mining of both positive and negative association rules", journal = j-TOIS, volume = "22", number = "3", pages = "381--405", month = jul, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gladney:2004:TYD, author = "Henry M. Gladney", title = "Trustworthy 100-year digital objects: {Evidence} after every witness is dead", journal = j-TOIS, volume = "22", number = "3", pages = "406--436", month = jul, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Miller:2004:PTP, author = "Bradley N. Miller and Joseph A. Konstan and John Riedl", title = "{PocketLens}: {Toward} a personal recommender system", journal = j-TOIS, volume = "22", number = "3", pages = "437--476", month = jul, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{King:2004:DCB, author = "Irwin King and Cheuk Hang Ng and Ka Cheung Sia", title = "Distributed content-based visual information retrieval system on peer-to-peer networks", journal = j-TOIS, volume = "22", number = "3", pages = "477--501", month = jul, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Brafman:2004:QDM, author = "Ronen I. Brafman and Carmel Domshlak and Solomon E. Shimony", title = "Qualitative decision making in adaptive presentation of structured information", journal = j-TOIS, volume = "22", number = "4", pages = "503--539", month = oct, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Park:2004:ALS, author = "Seung-Taek Park and David M. Pennock and C. Lee Giles and Robert Krovetz", title = "Analysis of lexical signatures for improving information persistence on the {World Wide Web}", journal = j-TOIS, volume = "22", number = "4", pages = "540--572", month = oct, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Williams:2004:FPQ, author = "Hugh E. Williams and Justin Zobel and Dirk Bahle", title = "Fast phrase querying with combined indexes", journal = j-TOIS, volume = "22", number = "4", pages = "573--594", month = oct, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Park:2004:ISI, author = "Jinsoo Park and Sudha Ram", title = "Information systems interoperability: {What} lies beneath?", journal = j-TOIS, volume = "22", number = "4", pages = "595--632", month = oct, year = "2004", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Nov 4 08:03:37 MST 2004", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Williams:2005:IGI, author = "Hugh E. Williams", title = "Introduction to genomic information retrieval", journal = j-TOIS, volume = "23", number = "1", pages = "1--2", month = jan, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 12 07:07:01 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Korodi:2005:ENM, author = "Gergely Korodi and Ioan Tabus", title = "An efficient normalized maximum likelihood algorithm for {DNA} sequence compression", journal = j-TOIS, volume = "23", number = "1", pages = "3--34", month = jan, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 12 07:07:01 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Sander:2005:MAS, author = "J{\"o}rg Sander and Raymond T. Ng and Monica C. Sleumer and Man Saint Yuen and Steven J. Jones", title = "A methodology for analyzing {SAGE} libraries for cancer profiling", journal = j-TOIS, volume = "23", number = "1", pages = "35--60", month = jan, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 12 07:07:01 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tao:2005:HST, author = "Yufei Tao and Dimitris Papadias", title = "Historical spatio-temporal aggregation", journal = j-TOIS, volume = "23", number = "1", pages = "61--102", month = jan, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 12 07:07:01 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Adomavicius:2005:ICI, author = "Gediminas Adomavicius and Ramesh Sankaranarayanan and Shahana Sen and Alexander Tuzhilin", title = "Incorporating contextual information in recommender systems using a multidimensional approach", journal = j-TOIS, volume = "23", number = "1", pages = "103--145", month = jan, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 12 07:07:01 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fox:2005:EIM, author = "Steve Fox and Kuldeep Karnawat and Mark Mydland and Susan Dumais and Thomas White", title = "Evaluating implicit measures to improve {Web} search", journal = j-TOIS, volume = "23", number = "2", pages = "147--168", month = apr, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 26 17:34:31 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cooper:2005:AHS, author = "Brian F. Cooper and Hector Garcia-Molina", title = "Ad hoc, self-supervising peer-to-peer search networks", journal = j-TOIS, volume = "23", number = "2", pages = "169--200", month = apr, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 26 17:34:31 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Xu:2005:CEF, author = "Jennifer J. Xu and Hsinchun Chen", title = "{CrimeNet} explorer: a framework for criminal network knowledge discovery", journal = j-TOIS, volume = "23", number = "2", pages = "201--226", month = apr, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Apr 26 17:34:31 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wei:2005:MBA, author = "Yan Zheng Wei and Luc Moreau and Nicholas R. Jennings", title = "A market-based approach to recommender systems", journal = j-TOIS, volume = "23", number = "3", pages = "227--266", month = jul, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Sep 22 11:21:45 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Park:2005:NDR, author = "Laurence A. F. Park and Kotagiri Ramamohanarao and Marimuthu Palaniswami", title = "A novel document retrieval method using the discrete wavelet transform", journal = j-TOIS, volume = "23", number = "3", pages = "267--298", month = jul, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Sep 22 11:21:45 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gladney:2005:TYD, author = "H. M. Gladney and R. A. Lorie", title = "Trustworthy 100-year digital objects: durable encoding for when it's too late to ask", journal = j-TOIS, volume = "23", number = "3", pages = "299--324", month = jul, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Sep 22 11:21:45 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{White:2005:EIF, author = "Ryen W. White and Ian Ruthven and Joemon M. Jose and C. J. {Van Rijsbergen}", title = "Evaluating implicit feedback models using searcher simulations", journal = j-TOIS, volume = "23", number = "3", pages = "325--361", month = jul, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Thu Sep 22 11:21:45 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chuang:2005:TGT, author = "Shui-Lung Chuang and Lee-Feng Chien", title = "Taxonomy generation for text segments: a practical {Web}-based approach", journal = j-TOIS, volume = "23", number = "4", pages = "363--396", month = oct, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Oct 25 06:41:53 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Possas:2005:SBV, author = "Bruno P{\^o}ssas and Nivio Ziviani and Wagner {Meira, Jr.} and Berthier Ribeiro-Neto", title = "Set-based vector model: an efficient approach for correlation-based ranking", journal = j-TOIS, volume = "23", number = "4", pages = "397--429", month = oct, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Oct 25 06:41:53 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pant:2005:LCC, author = "Gautam Pant and Padmini Srinivasan", title = "Learning to crawl: {Comparing} classification schemes", journal = j-TOIS, volume = "23", number = "4", pages = "430--462", month = oct, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Oct 25 06:41:53 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ivory:2005:EWS, author = "Melody Y. Ivory and Rodrick Megraw", title = "Evolution of {Web} site design patterns", journal = j-TOIS, volume = "23", number = "4", pages = "463--497", month = oct, year = "2005", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Tue Oct 25 06:41:53 MDT 2005", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zobel:2006:DVS, author = "J. Zobel", title = "Detection of video sequences using compact signatures", journal = j-TOIS, volume = "24", number = "1", pages = "1--50", month = jan, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1125857.1125858", ISSN = "1046-8188", bibdate = "Sat Apr 22 06:10:51 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fagni:2006:BPW, author = "Tiziano Fagni and Raffaele Perego and Fabrizio Silvestri and Salvatore Orlando", title = "Boosting the performance of {Web} search engines: {Caching} and prefetching query results by exploiting historical usage data", journal = j-TOIS, volume = "24", number = "1", pages = "51--78", month = jan, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1125857.1125859", ISSN = "1046-8188", bibdate = "Sat Apr 22 06:10:51 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Qian:2006:SPB, author = "Gang Qian and Qiang Zhu and Qiang Xue and Sakti Pramanik", title = "A space-partitioning-based indexing method for multidimensional non-ordered discrete data spaces", journal = j-TOIS, volume = "24", number = "1", pages = "79--110", month = jan, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1125857.1125860", ISSN = "1046-8188", bibdate = "Sat Apr 22 06:10:51 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{McDonald:2006:SCS, author = "Daniel M. McDonald and Hsinchun Chen", title = "Summary in context: {Searching} versus browsing", journal = j-TOIS, volume = "24", number = "1", pages = "111--141", month = jan, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1125857.1125861", ISSN = "1046-8188", bibdate = "Sat Apr 22 06:10:51 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Marchionini:2006:TR, author = "Gary Marchionini", title = "{TOIS} reviewers 2003--2005", journal = j-TOIS, volume = "24", number = "1", pages = "142--143", month = jan, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1125857.1125862", ISSN = "1046-8188", bibdate = "Sat Apr 22 06:10:51 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lee:2006:UEF, author = "Hyowon Lee and Alan F. Smeaton and Noel E. O'Connor and Barry Smyth", title = "User evaluation of {F{\'\i}schl{\'a}r-News}: an automatic broadcast news delivery system", journal = j-TOIS, volume = "24", number = "2", pages = "145--189", month = apr, year = "2006", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Wed Aug 23 09:31:12 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gao:2006:MFM, author = "Sheng Gao and Wen Wu and Chin-Hui Lee and Tat-Seng Chua", title = "A maximal figure-of-merit {(MFoM)-learning} approach to robust classifier design for text categorization", journal = j-TOIS, volume = "24", number = "2", pages = "190--218", month = apr, year = "2006", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Wed Aug 23 09:31:12 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhou:2006:ERF, author = "Zhi-Hua Zhou and Ke-Jia Chen and Hong-Bin Dai", title = "Enhancing relevance feedback in image retrieval using unlabeled data", journal = j-TOIS, volume = "24", number = "2", pages = "219--244", month = apr, year = "2006", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Wed Aug 23 09:31:12 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chen:2006:IIV, author = "Keke Chen and Ling Liu", title = "{iVIBRATE}: {Interactive} visualization-based framework for clustering large datasets", journal = j-TOIS, volume = "24", number = "2", pages = "245--294", month = apr, year = "2006", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Wed Aug 23 09:31:12 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Jiang:2006:ECR, author = "Jing Jiang and Chengxiang Zhai", title = "Extraction of coherent relevant passages using hidden {Markov} models", journal = j-TOIS, volume = "24", number = "3", pages = "295--319", month = jul, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1165774.1165775", ISSN = "1046-8188", bibdate = "Wed Oct 11 07:12:08 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Shen:2006:QEW, author = "Dou Shen and Rong Pan and Jian-Tao Sun and Jeffrey Junfeng Pan and Kangheng Wu and Jie Yin and Qiang Yang", title = "Query enrichment for web-query classification", journal = j-TOIS, volume = "24", number = "3", pages = "320--352", month = jul, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1165774.1165776", ISSN = "1046-8188", bibdate = "Wed Oct 11 07:12:08 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tsai:2006:CMS, author = "Chih-Fong Tsai and Ken McGarry and John Tait", title = "{CLAIRE}: a modular support vector image indexing and classification system", journal = j-TOIS, volume = "24", number = "3", pages = "353--379", month = jul, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1165774.1165777", ISSN = "1046-8188", bibdate = "Wed Oct 11 07:12:08 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yu:2006:LSC, author = "Hong Yu and Won Kim and Vasileios Hatzivassiloglou and John Wilbur", title = "A large scale, corpus-based approach for automatically disambiguating biomedical abbreviations", journal = j-TOIS, volume = "24", number = "3", pages = "380--404", month = jul, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1165774.1165778", ISSN = "1046-8188", bibdate = "Wed Oct 11 07:12:08 MDT 2006", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Abbreviations and acronyms are widely used in the biomedical literature and many of them represent important biomedical concepts. Because many abbreviations are ambiguous (e.g., CAT denotes both chloramphenicol acetyl transferase and computed axial tomography, depending on the context), recognizing the full form associated with each abbreviation is in most cases equivalent to identifying the meaning of the abbreviation. This, in turn, allows us to perform more accurate natural language processing, information extraction, and retrieval. In this study, we have developed supervised approaches to identifying the full forms of ambiguous abbreviations within the context they appear. We first automatically assigned multiple possible full forms for each abbreviation; we then treated the in-context full-form prediction for each specific abbreviation occurrence as a case of word-sense disambiguation. We generated automatically a dictionary of all possible full forms for each abbreviation. We applied supervised machine-learning algorithms for disambiguation. Because some of the links between abbreviations and their corresponding full forms are explicitly given in the text and can be recovered automatically, we can use these explicit links to automatically provide training data for disambiguating the abbreviations that are not linked to a full form within a text. We evaluated our methods on over 150 thousand abstracts and obtain for coverage and precision results of 82\% and 92\%, respectively, when performed as tenfold cross-validation, and 79\% and 80\%, respectively, when evaluated against an external set of abstracts in which the abbreviations are not defined.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Baeza-Yates:2006:ISI, author = "Ricardo Baeza-Yates and Norbert Fuhr and Yoelle Maarek", title = "Introduction to the special issue on {XML} retrieval", journal = j-TOIS, volume = "24", number = "4", pages = "405--406", month = oct, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1185877.1185878", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:35 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Kamps:2006:AIN, author = "Jaap Kamps and Maarten Marx and Maarten de Rijke and B{\"o}rkur Sigurbj{\"o}rnsson", title = "Articulating information needs in {XML} query languages", journal = j-TOIS, volume = "24", number = "4", pages = "407--436", month = oct, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1185877.1185879", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:35 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Document-centric XML is a mixture of text and structure. With the increased availability of document-centric XML documents comes a need for query facilities in which both structural constraints and constraints on the content of the documents can be expressed. How does the expressiveness of languages for querying XML documents help users to express their information needs? We address this question from both an experimental and a theoretical point of view. Our experimental analysis compares a structure-ignorant with a structure-aware retrieval approach using the test suite of the INEX XML Retrieval Evaluation Initiative. Theoretically, we create two mathematical models of users' knowledge of a set of documents and define query languages which exactly fit these models. One of these languages corresponds to an XML version of fielded search, the other to the INEX query language. Our main experimental findings are: First, while structure is used in varying degrees of complexity, two-thirds of the queries can be expressed in a fielded-search-like format which does not use the hierarchical structure of the documents. Second, three-quarters of the queries use constraints on the context of the elements to be returned; these contextual constraints cannot be captured by ordinary keyword queries. Third, structure is used as a search hint, and not as a strict requirement, when judged against the underlying information need. Fourth, the use of structure in queries functions as a precision enhancing device.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Full-text XML querying; XML retrieval; XPath", } @Article{Crouch:2006:DER, author = "Carolyn J. Crouch", title = "Dynamic element retrieval in a structured environment", journal = j-TOIS, volume = "24", number = "4", pages = "437--454", month = oct, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1185877.1185880", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:35 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This research examines the feasibility of dynamic element retrieval in a structured environment. Structured documents and queries are represented in extended vector form, based on a modification of the basic vector space model suggested by Fox [1983]. A method for the dynamic retrieval of XML elements, which requires only a single indexing of the documents at the level of the basic indexing node, is presented. This method, which we refer to as flexible retrieval, produces a rank ordered list of retrieved elements that is equivalent to the result produced by the same retrieval against an all-element index of the collection. Flexible retrieval obviates the need for storing either an all-element index or multiple indices of the collection.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "dynamic element retrieval; flexible retrieval; structured retrieval; vector space model; XML", } @Article{Lehtonen:2006:PHX, author = "Miro Lehtonen", title = "Preparing heterogeneous {XML} for full-text search", journal = j-TOIS, volume = "24", number = "4", pages = "455--474", month = oct, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1185877.1185881", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:35 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "XML retrieval is facing new challenges when applied to heterogeneous XML documents, where next to nothing about the document structure can be taken for granted. We have developed solutions where some of the heterogeneity issues are addressed. Our fragment selection algorithm selectively divides a heterogeneous document collection into equi-sized fragments with full-text content. If the content is considered too data-oriented, it is not accepted. The algorithm needs no information about element names. In addition, three techniques for fragment expansion are presented, all of which yield a 13--17\% average improvement in average precision. These techniques and algorithms are among the first steps in developing document-type-independent indexing methods for the full text in heterogeneous XML collections.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "heterogeneous documents; indexing; XML retrieval", } @Article{Geneves:2006:SSA, author = "Pierre Genev{\`e}s and Nabil Laya{\"\i}da", title = "A system for the static analysis of {XPath}", journal = j-TOIS, volume = "24", number = "4", pages = "475--502", month = oct, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1185877.1185882", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:35 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "XPath is the standard language for navigating XML documents and returning a set of matching nodes. We present a sound and complete decision procedure for containment of XPath queries, as well as other related XPath decision problems such as satisfiability, equivalence, overlap, and coverage. The considered XPath fragment covers most of the language features used in practice. Specifically, we propose a unifying logic for XML, namely, the alternation-free modal $\mu$-calculus with converse. We show how to translate major XML concepts such as XPath and regular XML types (including DTDs) into this logic. Based on these embeddings, we show how XPath decision problems, in the presence or absence of XML types, can be solved using a decision procedure for $\mu$-calculus satisfiability. We provide a complexity analysis of our system together with practical experiments to illustrate the efficiency of the approach for realistic scenarios.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Containment; equivalence; logic; query; XML; XPath", } @Article{Kazai:2006:ECG, author = "Gabriella Kazai and Mounia Lalmas", title = "{eXtended} cumulated gain measures for the evaluation of content-oriented {XML} retrieval", journal = j-TOIS, volume = "24", number = "4", pages = "503--542", month = oct, year = "2006", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1185877.1185883", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:35 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We propose and evaluate a family of measures, the eXtended Cumulated Gain (XCG) measures, for the evaluation of content-oriented XML retrieval approaches. Our aim is to provide an evaluation framework that allows the consideration of dependency among XML document components. In particular, two aspects of dependency are considered: (1) near-misses, which are document components that are structurally related to relevant components, such as a neighboring paragraph or container section, and (2) overlap, which regards the situation wherein the same text fragment is referenced multiple times, for example, when a paragraph and its container section are both retrieved. A further consideration is that the measures should be flexible enough so that different models of user behavior may be instantiated within. Both system- and user-oriented aspects are investigated and both recall and precision-like qualities are measured. We evaluate the reliability of the proposed measures based on the INEX 2004 test collection. For example, the effects of assessment variation and topic set size on evaluation stability are investigated, and the upper and lower bounds of expected error rates are established. The evaluation demonstrates that the XCG measures are stable and reliable, and in particular, that the novel measures of effort-precision and gain-recall ( ep / gr ) show comparable behavior to established IR measures like precision and recall.", acknowledgement = ack-nhfb, fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "cumulated gain; dependency; evaluation; INEX; metrics; near-miss; overlap; XML retrieval", } @Article{Piwowarski:2007:PRU, author = "B. Piwowarski and P. Gallinari and G. Dupret", title = "Precision recall with user modeling {(PRUM)}: {Application} to structured information retrieval", journal = j-TOIS, volume = "25", number = "1", pages = "1:1--1:??", month = feb, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1198296.1198297", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:47 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Standard Information Retrieval (IR) metrics are not well suited for new paradigms like XML or Web IR in which retrievable information units are document elements and/or sets of related documents. Part of the problem stems from the classical hypotheses on the user models: They do not take into account the structural or logical context of document elements or the possibility of navigation between units. This article proposes an explicit and formal user model that encompasses a large variety of user behaviors. Based on this model, we extend the probabilistic precision-recall metric to deal with the new IR paradigms.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Evaluation; information retrieval; measure; precision-recall; Web; XML", } @Article{Lam:2007:NET, author = "Wai Lam and Shing-Kit Chan and Ruizhang Huang", title = "Named entity translation matching and learning: {With} application for mining unseen translations", journal = j-TOIS, volume = "25", number = "1", pages = "2:1--2:??", month = feb, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1198296.1198298", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:47 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article introduces a named entity matching model that makes use of both semantic and phonetic evidence. The matching of semantic and phonetic information is captured by a unified framework via a bipartite graph model. By considering various technical challenges of the problem, including order insensitivity and partial matching, this approach is less rigid than existing approaches and highly robust. One major component is a phonetic matching model which exploits similarity at the phoneme level. Two learning algorithms for learning the similarity information of basic phonemic matching units based on training examples are investigated. By applying the proposed named entity matching model, a mining system is developed for discovering new named entity translations from daily Web news. The system is able to discover new name translations that cannot be found in the existing bilingual dictionary.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "learning phonetic information; named entity translation; Text mining", } @Article{Chai:2007:EIU, author = "Joyce Y. Chai and Chen Zhang and Rong Jin", title = "An empirical investigation of user term feedback in text-based targeted image search", journal = j-TOIS, volume = "25", number = "1", pages = "3:1--3:??", month = feb, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1198296.1198299", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:47 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Text queries are natural and intuitive for users to describe their information needs. However, text-based image retrieval faces many challenges. Traditional text retrieval techniques on image descriptions have not been very successful. This is mainly due to the inconsistent textual descriptions and the discrepancies between user queries and terms in the descriptions. To investigate strategies to alleviate this vocabulary problem, this article examines the role of user term feedback in targeted image search that is based on text-based image retrieval. Term feedback refers to the feedback from a user on specific terms regarding their relevance to a target image. Previous studies have indicated the effectiveness of term feedback in interactive text retrieval. However, in our experiments on text-based image retrieval, the term feedback has not been shown to be effective. Our results indicate that, although term feedback has a positive effect by allowing users to identify more relevant terms, it also has a strong negative effect by providing more opportunities for users to specify irrelevant terms. To understand these different effects and their implications, this article further analyzes important factors that contribute to the utility of term feedback and discusses the outlook of term feedback in interactive text-based image retrieval.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Text-based interactive image retrieval; user term feedback", } @Article{Talvensaari:2007:CEC, author = "Tuomas Talvensaari and Jorma Laurikkala and Kalervo J{\"a}rvelin and Martti Juhola and Heikki Keskustalo", title = "Creating and exploiting a comparable corpus in cross-language information retrieval", journal = j-TOIS, volume = "25", number = "1", pages = "4:1--4:??", month = feb, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1198296.1198300", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:47 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present a method for creating a comparable text corpus from two document collections in different languages. The collections can be very different in origin. In this study, we build a comparable corpus from articles by a Swedish news agency and a U.S. newspaper. The keys with best resolution power were extracted from the documents of one collection, the source collection, by using the relative average term frequency (RATF) value. The keys were translated into the language of the other collection, the target collection, with a dictionary-based query translation program. The translated queries were run against the target collection and an alignment pair was made if the retrieved documents matched given date and similarity score criteria. The resulting comparable collection was used as a similarity thesaurus to translate queries along with a dictionary-based translator. The combined approaches outperformed translation schemes where dictionary-based translation or corpus translation was used alone.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "comparable corpora; Cross-language information retrieval; query translation", } @Article{Ma:2007:IBP, author = "Zhongming Ma and Gautam Pant and Olivia R. Liu Sheng", title = "Interest-based personalized search", journal = j-TOIS, volume = "25", number = "1", pages = "5:1--5:??", month = feb, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1198296.1198301", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:47 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Web search engines typically provide search results without considering user interests or context. We propose a personalized search approach that can easily extend a conventional search engine on the client side. Our mapping framework automatically maps a set of known user interests onto a group of categories in the Open Directory Project (ODP) and takes advantage of manually edited data available in ODP for training text classifiers that correspond to, and therefore categorize and personalize search results according to user interests. In two sets of controlled experiments, we compare our personalized categorization system (PCAT) with a list interface system (LIST) that mimics a typical search engine and with a nonpersonalized categorization system (CAT). In both experiments, we analyze system performances on the basis of the type of task and query length. We find that PCAT is preferable to LIST for information gathering types of tasks and for searches with short queries, and PCAT outperforms CAT in both information gathering and finding types of tasks, and for searches associated with free-form queries. From the subjects' answers to a questionnaire, we find that PCAT is perceived as a system that can find relevant Web pages quicker and easier than LIST and CAT.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "information retrieval; Open Directory; Personalized search; user interest; user interface; World Wide Web", } @Article{Lin:2007:EPU, author = "Jimmy Lin", title = "An exploration of the principles underlying redundancy-based factoid question answering", journal = j-TOIS, volume = "25", number = "2", pages = "6:1--6:??", month = apr, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1229179.1229180", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:57 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The so-called ``redundancy-based'' approach to question answering represents a successful strategy for mining answers to factoid questions such as ``Who shot Abraham Lincoln?'' from the World Wide Web. Through contrastive and ablation experiments with Aranea, a system that has performed well in several TREC QA evaluations, this work examines the underlying assumptions and principles behind redundancy-based techniques. Specifically, we develop two theses: that stable characteristics of data redundancy allow factoid systems to rely on external ``black box'' components, and that despite embodying a data-driven approach, redundancy-based methods encode a substantial amount of knowledge in the form of heuristics. Overall, this work attempts to address the broader question of ``what really matters'' and to provide guidance for future researchers.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Data redundancy; Web search", } @Article{Joachims:2007:EAI, author = "Thorsten Joachims and Laura Granka and Bing Pan and Helene Hembrooke and Filip Radlinski and Geri Gay", title = "Evaluating the accuracy of implicit feedback from clicks and query reformulations in {Web} search", journal = j-TOIS, volume = "25", number = "2", pages = "7:1--7:??", month = apr, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1229179.1229181", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:57 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article examines the reliability of implicit feedback generated from clickthrough data and query reformulations in World Wide Web (WWW) search. Analyzing the users' decision process using eyetracking and comparing implicit feedback against manual relevance judgments, we conclude that clicks are informative but biased. While this makes the interpretation of clicks as absolute relevance judgments difficult, we show that relative preferences derived from clicks are reasonably accurate on average. We find that such relative preferences are accurate not only between results from an individual query, but across multiple sets of results within chains of query reformulations.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Clickthrough data; eye-tracking; implicit feedback; query reformulations; user studies", } @Article{Cui:2007:SPM, author = "Hang Cui and Min-Yen Kan and Tat-Seng Chua", title = "Soft pattern matching models for definitional question answering", journal = j-TOIS, volume = "25", number = "2", pages = "8:1--8:??", month = apr, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1229179.1229182", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:57 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We explore probabilistic lexico-syntactic pattern matching, also known as soft pattern matching, in a definitional question answering system. Most current systems use regular expression-based hard matching patterns to identify definition sentences. Such rigid surface matching often fares poorly when faced with language variations. We propose two soft matching models to address this problem: one based on bigrams and the other on the Profile Hidden Markov Model (PHMM). Both models provide a theoretically sound method to model pattern matching as a probabilistic process that generates token sequences. We demonstrate the effectiveness of the models on definition sentence retrieval for definitional question answering. We show that both models significantly outperform the state-of-the-art manually constructed hard matching patterns on recent TREC data.\par A critical difference between the two models is that the PHMM has a more complex topology. We experimentally show that the PHMM can handle language variations more effectively but requires more training data to converge.\par While we evaluate soft pattern models only on definitional question answering, we believe that both models are generic and can be extended to other areas where lexico-syntactic pattern matching can be applied.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "definitional question answering; Soft patterns", } @Article{Beitzel:2007:ACW, author = "Steven M. Beitzel and Eric C. Jensen and David D. Lewis and Abdur Chowdhury and Ophir Frieder", title = "Automatic classification of {Web} queries using very large unlabeled query logs", journal = j-TOIS, volume = "25", number = "2", pages = "9:1--9:??", month = apr, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1229179.1229183", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:51:57 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Accurate topical classification of user queries allows for increased effectiveness and efficiency in general-purpose Web search systems. Such classification becomes critical if the system must route queries to a subset of topic-specific and resource-constrained back-end databases. Successful query classification poses a challenging problem, as Web queries are short, thus providing few features. This feature sparseness, coupled with the constantly changing distribution and vocabulary of queries, hinders traditional text classification. We attack this problem by combining multiple classifiers, including exact lookup and partial matching in databases of manually classified frequent queries, linear models trained by supervised learning, and a novel approach based on mining selectional preferences from a large unlabeled query log. Our approach classifies queries without using external sources of information, such as online Web directories or the contents of retrieved pages, making it viable for use in demanding operational environments, such as large-scale Web search services. We evaluate our approach using a large sample of queries from an operational Web search engine and show that our combined method increases recall by nearly 40\% over the best single method while maintaining adequate precision. Additionally, we compare our results to those from the 2005 KDD Cup and find that we perform competitively despite our operational restrictions. This suggests it is possible to topically classify a significant portion of the query stream without requiring external sources of information, allowing for deployment in operationally restricted environments.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Baralis:2007:AXQ, author = "Elena Baralis and Paolo Garza and Elisa Quintarelli and Letizia Tanca", title = "Answering {XML} queries by means of data summaries", journal = j-TOIS, volume = "25", number = "3", pages = "10:1--10:??", month = jul, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1247715.1247716", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:07 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "XML is a rather verbose representation of semistructured data, which may require huge amounts of storage space. We propose a summarized representation of XML data, based on the concept of instance pattern, which can both provide succinct information and be directly queried. The physical representation of instance patterns exploits itemsets or association rules to summarize the content of XML datasets. Instance patterns may be used for (possibly partially) answering queries, either when fast and approximate answers are required, or when the actual dataset is not available, for example, it is currently unreachable. Experiments on large XML documents show that instance patterns allow a significant reduction in storage space, while preserving almost entirely the completeness of the query result. Furthermore, they provide fast query answers and show good scalability on the size of the dataset, thus overcoming the document size limitation of most current XQuery engines.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Association rules; data mining; data summarization; intensional answers; itemsets; semistructured data", } @Article{Cormack:2007:OSS, author = "Gordon V. Cormack and Thomas R. Lynam", title = "Online supervised spam filter evaluation", journal = j-TOIS, volume = "25", number = "3", pages = "11:1--11:??", month = jul, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1247715.1247717", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:07 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Eleven variants of six widely used open-source spam filters are tested on a chronological sequence of 49086 e-mail messages received by an individual from August 2003 through March 2004. Our approach differs from those previously reported in that the test set is large, comprises uncensored raw messages, and is presented to each filter sequentially with incremental feedback. Misclassification rates and Receiver Operating Characteristic Curve measurements are reported, with statistical confidence intervals. Quantitative results indicate that content-based filters can eliminate 98\% of spam while incurring 0.1\% legitimate email loss. Qualitative results indicate that the risk of loss depends on the nature of the message, and that messages likely to be lost may be those that are less critical. More generally, our methodology has been encapsulated in a free software toolkit, which may used to conduct similar experiments.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "email; Spam; text classification", } @Article{Zhou:2007:DPM, author = "Changqing Zhou and Dan Frankowski and Pamela Ludford and Shashi Shekhar and Loren Terveen", title = "Discovering personally meaningful places: an interactive clustering approach", journal = j-TOIS, volume = "25", number = "3", pages = "12:1--12:??", month = jul, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1247715.1247718", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:07 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The discovery of a person's meaningful places involves obtaining the physical locations and their labels for a person's places that matter to his daily life and routines. This problem is driven by the requirements from emerging location-aware applications, which allow a user to pose queries and obtain information in reference to places, for example, ``home'', ``work'' or ``Northwest Health Club''. It is a challenge to map from physical locations to personally meaningful places due to a lack of understanding of what constitutes the real users' personally meaningful places. Previous work has explored algorithms to discover personal places from location data. However, we know of no systematic empirical evaluations of these algorithms, leaving designers of location-aware applications in the dark about their choices.\par Our work remedies this situation. We extended a clustering algorithm to discover places. We also defined a set of essential evaluation metrics and an interactive evaluation framework. We then conducted a large-scale experiment that collected real users' location data and personally meaningful places, and illustrated the utility of our evaluation framework. Our results establish a baseline that future work can measure itself against. They also demonstrate that our algorithm discovers places with reasonable accuracy and outperforms the well-known K-Means clustering algorithm for place discovery. Finally, we provide evidence that shapes more complex than ``points'' are required to represent the full range of people's everyday places.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "clustering algorithms; field studies; location-aware applications; place discovery; Ubiquitous computing", } @Article{He:2007:SHP, author = "Ben He and Iadh Ounis", title = "On setting the hyper-parameters of term frequency normalization for information retrieval", journal = j-TOIS, volume = "25", number = "3", pages = "13:1--13:??", month = jul, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1247715.1247719", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:07 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The setting of the term frequency normalization hyper-parameter suffers from the query dependence and collection dependence problems, which remarkably hurt the robustness of the retrieval performance. Our study in this article investigates three term frequency normalization methods, namely normalization 2, BM25's normalization and the Dirichlet Priors normalization. We tackle the query dependence problem by modifying the query term weight using a Divergence From Randomness term weighting model, and tackle the collection dependence problem by measuring the correlation of the normalized term frequency with the document length. Our research hypotheses for the two problems, as well as an automatic hyper-parameter setting methodology, are extensively validated and evaluated on four Text REtrieval Conference (TREC) collections.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "collection-dependence; information retrieval models; Query-dependence; relevance feedback; term frequency normalization; TREC experimentation", } @Article{Jones:2007:TPQ, author = "Rosie Jones and Fernando Diaz", title = "Temporal profiles of queries", journal = j-TOIS, volume = "25", number = "3", pages = "14:1--14:??", month = jul, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1247715.1247720", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:07 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Documents with timestamps, such as email and news, can be placed along a timeline. The timeline for a set of documents returned in response to a query gives an indication of how documents relevant to that query are distributed in time. Examining the timeline of a query result set allows us to characterize both how temporally dependent the topic is, as well as how relevant the results are likely to be. We outline characteristic patterns in query result set timelines, and show experimentally that we can automatically classify documents into these classes. We also show that properties of the query result set timeline can help predict the mean average precision of a query. These results show that meta-features associated with a query can be combined with text retrieval techniques to improve our understanding and treatment of text search on documents with timestamps.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "ambiguity; event detection; language models; precision prediction; query classification; temporal profiles; Time", } @Article{Marchionini:2007:TRJ, author = "Gary Marchionini", title = "{TOIS} reviewers {January} 2006 through {May} 2007", journal = j-TOIS, volume = "25", number = "4", pages = "15:1--15:??", month = oct, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1281485.1281486", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:16 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bailey:2007:AHT, author = "Christopher Bailey and Wendy Hall and David E. Millard and Mark J. Weal", title = "Adaptive hypermedia through contextualized open hypermedia structures", journal = j-TOIS, volume = "25", number = "4", pages = "16:1--16:??", month = oct, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1281485.1281487", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:16 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The aim of this article is to produce an alternative view of the adaptive hypermedia (AH) domain from a contextually-aware open hypermedia (OH) perspective. We believe that a wide range of AH techniques can be supported with a small number of OH structures, which can be combined together to create more complex effects, possibly simplifying the development of new AH systems.\par In this work we reexamine Brusilovsky's taxonomy of AH techniques from a structural OH perspective. We also show that it is possible to identify and model common structures across the taxonomy of adaptive techniques. An agent-based adaptive hypermedia system called HA 3 L is presented, which uses these OH structures to provide a straightforward implementation of a variety of adaptive hypermedia techniques. This enables us to reflect on the structural equivalence of many of the techniques, demonstrates the advantages of the OH approach, and can inform the design of future adaptive hypermedia systems.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "adaptive hypermedia; Adaptive techniques; FOHM; hypermedia structure; open hypermedia", } @Article{Fang:2007:SMT, author = "Xiao Fang and Olivia R. Liu Sheng and Michael Chau", title = "{ServiceFinder}: a method towards enhancing service portals", journal = j-TOIS, volume = "25", number = "4", pages = "17:1--17:??", month = oct, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1281485.1281488", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:16 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The rapid advancement of Internet technologies enables more and more educational institutes, companies, and government agencies to provide services, namely online services, through web portals. With hundreds of online services provided through a web portal, it is critical to design web portals, namely service portals, through which online services can be easily accessed by their consumers. This article addresses this critical issue from the perspective of service selection, that is, how to select a small number of service-links (i.e., hyperlinks pointing to online services) to be featured in the homepage of a service portal such that users can be directed to find the online services they seek most effectively. We propose a mathematically formulated metric to measure the effectiveness of the selected service-links in directing users to locate their desired online services and formally define the service selection problem. A solution method, ServiceFinder, is then proposed. Using real-world data obtained from the Utah State Government service portal, we show that ServiceFinder outperforms both the current practice of service selection and previous algorithms for adaptive website design. We also show that the performance of ServiceFinder is close to that of the optimal solution resulting from exhaustive search.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "online service; Service portal; service selection", } @Article{Majumder:2007:YYA, author = "Prasenjit Majumder and Mandar Mitra and Swapan K. Parui and Gobinda Kole and Pabitra Mitra and Kalyankumar Datta", title = "{YASS}: {Yet} another suffix stripper", journal = j-TOIS, volume = "25", number = "4", pages = "18:1--18:??", month = oct, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1281485.1281489", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:16 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Stemmers attempt to reduce a word to its stem or root form and are used widely in information retrieval tasks to increase the recall rate. Most popular stemmers encode a large number of language-specific rules built over a length of time. Such stemmers with comprehensive rules are available only for a few languages. In the absence of extensive linguistic resources for certain languages, statistical language processing tools have been successfully used to improve the performance of IR systems. In this article, we describe a clustering-based approach to discover equivalence classes of root words and their morphological variants. A set of string distance measures are defined, and the lexicon for a given text collection is clustered using the distance measures to identify these equivalence classes. The proposed approach is compared with Porter's and Lovin's stemmers on the AP and WSJ subcollections of the Tipster dataset using 200 queries. Its performance is comparable to that of Porter's and Lovin's stemmers, both in terms of average precision and the total number of relevant documents retrieved. The proposed stemming algorithm also provides consistent improvements in retrieval performance for French and Bengali, which are currently resource-poor.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Bengali; clustering; corpus; French; Indian languages; stemming; string similarity", } @Article{Pinto:2007:NXM, author = "Alberto Pinto and Goffredo Haus", title = "A novel {XML} music information retrieval method using graph invariants", journal = j-TOIS, volume = "25", number = "4", pages = "19:1--19:??", month = oct, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1281485.1281490", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:16 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The increasing diffusion of XML languages for the encoding of domain-specific multimedia information raises the need for new information retrieval models that can fully exploit structural information. An XML language specifically designed for music like MX allows queries to be made directly on the thematic material. The main advantage of such a system is that it can handle symbolic, notational, and audio objects at the same time through a multilayered structure. On the model side, common music information retrieval methods do not take into account the inner structure of melodic themes and the metric relationships between notes.\par In this article we deal with two main topics: a novel architecture based on a new XML language for music and a new model of melodic themes based on graph theory.\par This model takes advantage of particular graph invariants that can be linked to melodic themes as metadata in order to characterize all their possible modifications through specific transformations and that can be exploited in filtering algorithms. We provide a similarity function and show through an evaluation stage how it improves existing methods, particularly in the case of same-structured themes.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Graphs; invariants; melodic similarity; metadata; music; music information retrieval; structural properties; XML", } @Article{Gerstel:2007:RHI, author = "Ori Gerstel and Shay Kutten and Eduardo Sany Laber and Rachel Matichin and David Peleg and Artur Alves Pessoa and Criston Souza", title = "Reducing human interactions in {Web} directory searches", journal = j-TOIS, volume = "25", number = "4", pages = "20:1--20:??", month = oct, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1281485.1281491", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:16 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Consider a website containing a collection of webpages with data such as in Yahoo or the Open Directory project. Each page is associated with a weight representing the frequency with which that page is accessed by users. In the tree hierarchy representation, accessing each page requires the user to travel along the path leading to it from the root. By enhancing the index tree with additional edges (hotlinks) one may reduce the access cost of the system. In other words, the hotlinks reduce the expected number of steps needed to reach a leaf page from the tree root, assuming that the user knows which hotlinks to take. The hotlink enhancement problem involves finding a set of hotlinks minimizing this cost.\par This article proposes the first exact algorithm for the hotlink enhancement problem. This algorithm runs in polynomial time for trees with logarithmic depth. Experiments conducted with real data show that significant improvement in the expected number of accesses per search can be achieved in websites using this algorithm. These experiments also suggest that the simple and much faster heuristic proposed previously by Czyzowicz et al. [2003] creates hotlinks that are nearly optimal in the time savings they provide to the user.\par The version of the hotlink enhancement problem in which the weight distribution on the leaves is unknown is discussed as well. We present a polynomial-time algorithm that is optimal for any tree for any depth.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "algorithms; directory tree; Hotlink; hotlist; hyperlink", } @Article{Jensen:2007:RES, author = "Eric C. Jensen and Steven M. Beitzel and Abdur Chowdhury and Ophir Frieder", title = "Repeatable evaluation of search services in dynamic environments", journal = j-TOIS, volume = "26", number = "1", pages = "1:1--1:??", month = nov, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1292591.1292592", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:26 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In dynamic environments, such as the World Wide Web, a changing document collection, query population, and set of search services demands frequent repetition of search effectiveness (relevance) evaluations. Reconstructing static test collections, such as in TREC, requires considerable human effort, as large collection sizes demand judgments deep into retrieved pools. In practice it is common to perform shallow evaluations over small numbers of live engines (often pairwise, engine A vs. engine B) without system pooling. Although these evaluations are not intended to construct reusable test collections, their utility depends on conclusions generalizing to the query population as a whole. We leverage the bootstrap estimate of the reproducibility probability of hypothesis tests in determining the query sample sizes required to ensure this, finding they are much larger than those required for static collections. We propose a semiautomatic evaluation framework to reduce this effort. We validate this framework against a manual evaluation of the top ten results of ten Web search engines across 896 queries in navigational and informational tasks. Augmenting manual judgments with pseudo-relevance judgments mined from Web taxonomies reduces both the chances of missing a correct pairwise conclusion, and those of finding an errant conclusion, by approximately 50\%.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Evaluation; Web search", } @Article{Pirkola:2007:FBI, author = "Ari Pirkola and Jarmo Toivonen and Heikki Keskustalo and Kalervo J{\"a}rvelin", title = "Frequency-based identification of correct translation equivalents {(FITE)} obtained through transformation rules", journal = j-TOIS, volume = "26", number = "1", pages = "2:1--2:??", month = nov, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1292591.1292593", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:26 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We devised a novel statistical technique for the identification of the translation equivalents of source words obtained by transformation rule based translation (TRT). The effectiveness of the technique called frequency-based identification of translation equivalents ( FITE ) was tested using biological and medical cross-lingual spelling variants and out-of-vocabulary (OOV) words in Spanish--English and Finnish-English TRT. The results showed that, depending on the source language and frequency corpus, FITE-TRT (the identification of translation equivalents from TRT's translation set by means of the FITE technique) may achieve high translation recall. In the case of the Web as the frequency corpus, translation recall was 89.2\%--91.0\% for Spanish--English FITE-TRT. For both language pairs FITE-TRT achieved high translation precision: 95.0\%--98.8\%. The technique also reliably identified native source language words: source words that cannot be correctly translated by TRT. Dictionary-based CLIR augmented with FITE-TRT performed substantially better than basic dictionary-based CLIR where OOV keys were kept intact. FITE-TRT with Web document frequencies was the best technique among several fuzzy translation/matching approaches tested in cross-language retrieval experiments. We also discuss the application of FITE-TRT in the automatic construction of multilingual dictionaries.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Cross-language information retrieval; fuzzy matching; OOV words; transformation rules; transliteration", } @Article{Agosti:2007:FMA, author = "Maristella Agosti and Nicola Ferro", title = "A formal model of annotations of digital content", journal = j-TOIS, volume = "26", number = "1", pages = "3:1--3:??", month = nov, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1292591.1292594", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:26 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article is a study of the themes and issues concerning the annotation of digital contents, such as textual documents, images, and multimedia documents in general. These digital contents are automatically managed by different kinds of digital library management systems and more generally by different kinds of information management systems.\par Even though this topic has already been partially studied by other researchers, the previous research work on annotations has left many open issues. These issues concern the lack of clarity about what an annotation is, what its features are, and how it is used. These issues are mainly due to the fact that models and systems for annotations have only been developed for specific purposes. As a result, there is only a fragmentary picture of the annotation and its management, and this is tied to specific contexts of use and lacks-general validity.\par The aim of the article is to provide a unified and integrated picture of the annotation, ranging from defining what an annotation is to providing a formal model. The key ideas of the model are: the distinction between the meaning and the sign of the annotation, which represent the semantics and the materialization of an annotation, respectively; the clear formalization of the temporal dimension involved with annotations; and the introduction of a distributed hypertext between digital contents and annotations. Therefore, the proposed formal model captures both syntactic and semantic aspects of the annotations. Furthermore, it is built on previously existing models and may be seen as an extension of them.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Annotation; digital content; digital library system; foundations; hypertext", } @Article{Im:2007:DOS, author = "Il Im and Alexander Hars", title = "Does a one-size recommendation system fit all? the effectiveness of collaborative filtering based recommendation systems across different domains and search modes", journal = j-TOIS, volume = "26", number = "1", pages = "4:1--4:??", month = nov, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1292591.1292595", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:26 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Collaborative filtering (CF) is a personalization technology that generates recommendations for users based on others' evaluations. CF is used by numerous e-commerce Web sites for providing personalized recommendations. Although much research has focused on refining collaborative filtering algorithms, little is known about the effects of user and domain characteristics on the accuracy of collaborative filtering systems. In this study, the effects of two factors---product domain and users' search mode---on the accuracy of CF are investigated. The effects of those factors are tested using data collected from two experiments in two different product domains, and from two large CF datasets, EachMovie and Book-Crossing. The study shows that the search mode of the users strongly influences the accuracy of the recommendations. CF works better when users look for specific information than when they search for general information. The accuracy drops significantly when data from different modes are mixed. The study also shows that CF is more accurate for knowledge domains than for consumer product domains. The results of this study imply that for more accurate recommendations, collaborative filtering systems should be able to identify and handle users' mode of search, even within the same domain and user group.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Collaborative filtering; recommendation systems", } @Article{Darwish:2007:ECV, author = "Kareem Darwish and Walid Magdy", title = "Error correction vs. query garbling for {Arabic OCR} document retrieval", journal = j-TOIS, volume = "26", number = "1", pages = "5:1--5:??", month = nov, year = "2007", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1292591.1292596", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:26 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Due to the existence of large numbers of legacy documents (such as old books and newspapers), improving retrieval effectiveness for OCR'ed documents continues to be an important problem. This article compares the effect of OCR error correction with and without language modeling and the effect of query garbling with weighted structured queries on the retrieval of OCR degraded Arabic documents. The results suggest that moderate error correction does not yield statistically significant improvement in retrieval effectiveness when indexing and searching using n-grams. Also, reversing error correction models to perform query garbling in conjunction with weighted structured queries yields improved retrieval effectiveness. Lastly, using very good error correction that utilizes language modeling yields the best improvement in retrieval effectiveness.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Arabic Retrieval; OCR Correction; OCR Retrieval", } @Article{Ipeirotis:2008:CAH, author = "Panagiotis G. Ipeirotis and Luis Gravano", title = "Classification-aware hidden-web text database selection", journal = j-TOIS, volume = "26", number = "2", pages = "6:1--6:??", month = mar, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1344411.1344412", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:34 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Many valuable text databases on the web have noncrawlable contents that are ``hidden'' behind search interfaces. Metasearchers are helpful tools for searching over multiple such ``hidden-web'' text databases at once through a unified query interface. An important step in the metasearching process is database selection, or determining which databases are the most relevant for a given user query. The state-of-the-art database selection techniques rely on statistical summaries of the database contents, generally including the database vocabulary and associated word frequencies. Unfortunately, hidden-web text databases typically do not export such summaries, so previous research has developed algorithms for constructing approximate content summaries from document samples extracted from the databases via querying. We present a novel ``focused-probing'' sampling algorithm that detects the topics covered in a database and adaptively extracts documents that are representative of the topic coverage of the database. Our algorithm is the first to construct content summaries that include the frequencies of the words in the database. Unfortunately, Zipf's law practically guarantees that for any relatively large database, content summaries built from moderately sized document samples will fail to cover many low-frequency words; in turn, incomplete content summaries might negatively affect the database selection process, especially for short queries with infrequent words. To enhance the sparse document samples and improve the database selection decisions, we exploit the fact that topically similar databases tend to have similar vocabularies, so samples extracted from databases with a similar topical focus can complement each other. We have developed two database selection algorithms that exploit this observation. The first algorithm proceeds hierarchically and selects the best categories for a query, and then sends the query to the appropriate databases in the chosen categories. The second algorithm uses ``shrinkage,'' a statistical technique for improving parameter estimation in the face of sparse data, to enhance the database content summaries with category-specific words. We describe how to modify existing database selection algorithms to adaptively decide (at runtime) whether shrinkage is beneficial for a query. A thorough evaluation over a variety of databases, including 315 real web databases as well as TREC data, suggests that the proposed sampling methods generate high-quality content summaries and that the database selection algorithms produce significantly more relevant database selection decisions and overall search results than existing algorithms.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "database selection; Distributed information retrieval; web search", } @Article{Abbasi:2008:WSA, author = "Ahmed Abbasi and Hsinchun Chen", title = "Writeprints: a stylometric approach to identity-level identification and similarity detection in cyberspace", journal = j-TOIS, volume = "26", number = "2", pages = "7:1--7:??", month = mar, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1344411.1344413", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:34 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "One of the problems often associated with online anonymity is that it hinders social accountability, as substantiated by the high levels of cybercrime. Although identity cues are scarce in cyberspace, individuals often leave behind textual identity traces. In this study we proposed the use of stylometric analysis techniques to help identify individuals based on writing style. We incorporated a rich set of stylistic features, including lexical, syntactic, structural, content-specific, and idiosyncratic attributes. We also developed the Writeprints technique for identification and similarity detection of anonymous identities. Writeprints is a Karhunen-Loeve transforms-based technique that uses a sliding window and pattern disruption algorithm with individual author-level feature sets. The Writeprints technique and extended feature set were evaluated on a testbed encompassing four online datasets spanning different domains: email, instant messaging, feedback comments, and program code. Writeprints outperformed benchmark techniques, including SVM, Ensemble SVM, PCA, and standard Karhunen-Loeve transforms, on the identification and similarity detection tasks with accuracy as high as 94\% when differentiating between 100 authors. The extended feature set also significantly outperformed a baseline set of features commonly used in previous research. Furthermore, individual-author-level feature sets generally outperformed use of a single group of attributes.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "discourse; online text; style classification; Stylometry; text mining", } @Article{Lau:2008:TBR, author = "Raymond Y. K. Lau and Peter D. Bruza and Dawei Song", title = "Towards a belief-revision-based adaptive and context-sensitive information retrieval system", journal = j-TOIS, volume = "26", number = "2", pages = "8:1--8:??", month = mar, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1344411.1344414", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:34 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In an adaptive information retrieval (IR) setting, the information seekers' beliefs about which terms are relevant or nonrelevant will naturally fluctuate. This article investigates how the theory of belief revision can be used to model adaptive IR. More specifically, belief revision logic provides a rich representation scheme to formalize retrieval contexts so as to disambiguate vague user queries. In addition, belief revision theory underpins the development of an effective mechanism to revise user profiles in accordance with information seekers' changing information needs. It is argued that information retrieval contexts can be extracted by means of the information-flow text mining method so as to realize a highly autonomous adaptive IR system. The extra bonus of a belief-based IR model is that its retrieval behavior is more predictable and explanatory. Our initial experiments show that the belief-based adaptive IR system is as effective as a classical adaptive IR system. To our best knowledge, this is the first successful implementation and evaluation of a logic-based adaptive IR model which can efficiently process large IR collections.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "adaptive information retrieval; Belief revision; information flow; retrieval context; text mining", } @Article{deMoura:2008:LBP, author = "Edleno Silva de Moura and Celia Francisca dos Santos and Bruno Dos santos de Araujo and Altigran Soares da Silva and Pavel Calado and Mario A. Nascimento", title = "Locality-Based pruning methods for web search", journal = j-TOIS, volume = "26", number = "2", pages = "9:1--9:??", month = mar, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1344411.1344415", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:34 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article discusses a novel approach developed for static index pruning that takes into account the locality of occurrences of words in the text. We use this new approach to propose and experiment on simple and effective pruning methods that allow a fast construction of the pruned index. The methods proposed here are especially useful for pruning in environments where the document database changes continuously, such as large-scale web search engines. Extensive experiments are presented showing that the proposed methods can achieve high compression rates while maintaining the quality of results for the most common query types present in modern search engines, namely, conjunctive and phrase queries. In the experiments, our locality-based pruning approach allowed reducing search engine indices to 30\% of their original size, with almost no reduction in precision at the top answers. Furthermore, we conclude that even an extremely simple locality-based pruning method can be competitive when compared to complex methods that do not rely on locality information.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "indexing; information retrieval; Pruning; search; search engines; web search", } @Article{Wang:2008:DSZ, author = "Xuanhui Wang and Tao Tao and Jian-Tao Sun and Azadeh Shakery and Chengxiang Zhai", title = "{DirichletRank}: {Solving} the zero-one gap problem of {PageRank}", journal = j-TOIS, volume = "26", number = "2", pages = "10:1--10:??", month = mar, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1344411.1344416", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:34 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Link-based ranking algorithms are among the most important techniques to improve web search. In particular, the PageRank algorithm has been successfully used in the Google search engine and has been attracting much attention recently. However, we find that PageRank has a ``zero-one gap'' problem which, to the best of our knowledge, has not been addressed in any previous work. This problem can be potentially exploited to spam PageRank results and make the state-of-the-art link-based antispamming techniques ineffective. The zero-one gap problem arises as a result of the current ad hoc way of computing transition probabilities in the random surfing model. We therefore propose a novel DirichletRank algorithm which calculates these probabilities using Bayesian estimation with a Dirichlet prior. DirichletRank is a variant of PageRank, but does not have the problem of zero-one gap and can be analytically shown substantially more resistant to some link spams than PageRank. Experiment results on TREC data show that DirichletRank can achieve better retrieval accuracy than PageRank due to its more reasonable allocation of transition probabilities. More importantly, experiments on the TREC dataset and another real web dataset from the Webgraph project show that, compared with the original PageRank, DirichletRank is more stable under link perturbation and is significantly more robust against both manually identified web spams and several simulated link spams. DirichletRank can be computed as efficiently as PageRank, and thus is scalable to large-scale web applications.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "DirichletRank; link analysis; PageRank; spamming; zero-one gap", } @Article{Cohen:2008:RTD, author = "Sara Cohen and Carmel Domshlak and Naama Zwerdling", title = "On ranking techniques for desktop search", journal = j-TOIS, volume = "26", number = "2", pages = "11:1--11:??", month = mar, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1344411.1344417", ISSN = "1046-8188", bibdate = "Thu Jun 12 16:52:34 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Users tend to store huge amounts of files, of various formats, on their personal computers. As a result, finding a specific, desired file within the file system is a challenging task. This article addresses the desktop search problem by considering various techniques for ranking results of a search query over the file system. First, basic ranking techniques, which are based on various file features (e.g., file name, access date, file size, etc.), are considered and their effectiveness is empirically analyzed. Next, two learning-based ranking schemes are presented, and are shown to be significantly more effective than the basic ranking methods. Finally, a novel ranking technique, based on query selectiveness, is considered for use during the cold-start period of the system. This method is also shown to be empirically effective, even though it does not involve any learning.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Desktop search; personal information management; ranking", } @Article{Abbasi:2008:SAM, author = "Ahmed Abbasi and Hsinchun Chen and Arab Salem", title = "Sentiment analysis in multiple languages: {Feature} selection for opinion classification in {Web} forums", journal = j-TOIS, volume = "26", number = "3", pages = "12:1--12:??", month = jun, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1361684.1361685", ISSN = "1046-8188", bibdate = "Thu Jun 19 08:32:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The Internet is frequently used as a medium for exchange of information and opinions, as well as propaganda dissemination. In this study the use of sentiment analysis methodologies is proposed for classification of Web forum opinions in multiple languages. The utility of stylistic and syntactic features is evaluated for sentiment classification of English and Arabic content. Specific feature extraction components are integrated to account for the linguistic characteristics of Arabic. The entropy weighted genetic algorithm (EWGA) is also developed, which is a hybridized genetic algorithm that incorporates the information-gain heuristic for feature selection. EWGA is designed to improve performance and get a better assessment of key features. The proposed features and techniques are evaluated on a benchmark movie review dataset and U.S. and Middle Eastern Web forum postings. The experimental results using EWGA with SVM indicate high performance levels, with accuracies of over 91\\% on the benchmark dataset as well as the U.S. and Middle Eastern forums. Stylistic features significantly enhanced performance across all testbeds while EWGA also outperformed other feature selection methods, indicating the utility of these features and techniques for document-level classification of sentiments.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "feature selection; opinion mining; Sentiment analysis; text classification", } @Article{Wu:2008:ITI, author = "Ho Chung Wu and Robert Wing Pong Luk and Kam Fai Wong and Kui Lam Kwok", title = "Interpreting {TF-IDF} term weights as making relevance decisions", journal = j-TOIS, volume = "26", number = "3", pages = "13:1--13:??", month = jun, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1361684.1361686", ISSN = "1046-8188", bibdate = "Thu Jun 19 08:32:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A novel probabilistic retrieval model is presented. It forms a basis to interpret the TF-IDF term weights as making relevance decisions. It simulates the local relevance decision-making for every location of a document, and combines all of these ``local'' relevance decisions as the ``document-wide'' relevance decision for the document. The significance of interpreting TF-IDF in this way is the potential to: (1) establish a unifying perspective about information retrieval as relevance decision-making; and (2) develop advanced TF-IDF-related term weights for future elaborate retrieval models. Our novel retrieval model is simplified to a basic ranking formula that directly corresponds to the TF-IDF term weights. In general, we show that the term-frequency factor of the ranking formula can be rendered into different term-frequency factors of existing retrieval systems. In the basic ranking formula, the remaining quantity $-\log p(\bar{r}| t \in d)$ is interpreted as the probability of randomly picking a nonrelevant usage (denoted by $\bar{r}$) of term $t$. Mathematically, we show that this quantity can be approximated by the inverse document-frequency (IDF). Empirically, we show that this quantity is related to IDF, using four reference TREC ad hoc retrieval data collections.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Information retrieval; relevance decision; term weight", } @Article{Melucci:2008:BIR, author = "Massimo Melucci", title = "A basis for information retrieval in context", journal = j-TOIS, volume = "26", number = "3", pages = "14:1--14:??", month = jun, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1361684.1361687", ISSN = "1046-8188", bibdate = "Thu Jun 19 08:32:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information retrieval (IR) models based on vector spaces have been investigated for a long time. Nevertheless, they have recently attracted much research interest. In parallel, context has been rediscovered as a crucial issue in information retrieval. This article presents a principled approach to modeling context and its role in ranking information objects using vector spaces. First, the article outlines how a basis of a vector space naturally represents context, both its properties and factors. Second, a ranking function computes the probability of context in the objects represented in a vector space, namely, the probability that a contextual factor has affected the preparation of an object.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Personalization; probability; quantum mechanics; vector-space model", } @Article{Altingovde:2008:ICB, author = "Ismail Sengor Altingovde and Engin Demir and Fazli Can and {\"O}zg{\"u}r Ulusoy", title = "Incremental cluster-based retrieval using compressed cluster-skipping inverted files", journal = j-TOIS, volume = "26", number = "3", pages = "15:1--15:??", month = jun, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1361684.1361688", ISSN = "1046-8188", bibdate = "Thu Jun 19 08:32:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We propose a unique cluster-based retrieval (CBR) strategy using a new cluster-skipping inverted file for improving query processing efficiency. The new inverted file incorporates cluster membership and centroid information along with the usual document information into a single structure. In our incremental-CBR strategy, during query evaluation, both best(-matching) clusters and the best(-matching) documents of such clusters are computed together with a single posting-list access per query term. As we switch from term to term, the best clusters are recomputed and can dynamically change. During query-document matching, only relevant portions of the posting lists corresponding to the best clusters are considered and the rest are skipped. The proposed approach is essentially tailored for environments where inverted files are compressed, and provides substantial efficiency improvement while yielding comparable, or sometimes better, effectiveness figures. Our experiments with various collections show that the incremental-CBR strategy using a compressed cluster-skipping inverted file significantly improves CPU time efficiency, regardless of query length. The new compressed inverted file imposes an acceptable storage overhead in comparison to a typical inverted file. We also show that our approach scales well with the collection size.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Best match; cluster-based retrieval (CBR); cluster-skipping inverted index structure (CS-IIS); full search (FS); index compression; inverted index structure (IIS); query processing", } @Article{Wang:2008:URM, author = "Jun Wang and Arjen P. de Vries and Marcel J. T. Reinders", title = "Unified relevance models for rating prediction in collaborative filtering", journal = j-TOIS, volume = "26", number = "3", pages = "16:1--16:??", month = jun, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1361684.1361689", ISSN = "1046-8188", bibdate = "Thu Jun 19 08:32:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Collaborative filtering aims at predicting a user's interest for a given item based on a collection of user profiles. This article views collaborative filtering as a problem highly related to information retrieval, drawing an analogy between the concepts of users and items in recommender systems and queries and documents in text retrieval.\par We present a probabilistic user-to-item relevance framework that introduces the concept of relevance into the related problem of collaborative filtering. Three different models are derived, namely, a user-based, an item-based, and a unified relevance model, and we estimate their rating predictions from three sources: the user's own ratings for different items, other users' ratings for the same item, and ratings from different but similar users for other but similar items.\par To reduce the data sparsity encountered when estimating the probability density function of the relevance variable, we apply the nonparametric (data-driven) density estimation technique known as the Parzen-window method (or kernel-based density estimation). Using a Gaussian window function, the similarity between users and/or items would, however, be based on Euclidean distance. Because the collaborative filtering literature has reported improved prediction accuracy when using cosine similarity, we generalize the Parzen-window method by introducing a projection kernel.\par Existing user-based and item-based approaches correspond to two simplified instantiations of our framework. User-based and item-based collaborative filterings represent only a partial view of the prediction problem, where the unified relevance model brings these partial views together under the same umbrella. Experimental results complement the theoretical insights with improved recommendation accuracy. The unified model is more robust to data sparsity because the different types of ratings are used in concert.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Collaborative filtering; personalization; recommendation", } @Article{Losada:2008:AMB, author = "David E. Losada and Leif Azzopardi", title = "Assessing multivariate {Bernoulli} models for information retrieval", journal = j-TOIS, volume = "26", number = "3", pages = "17:1--17:??", month = jun, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1361684.1361690", ISSN = "1046-8188", bibdate = "Thu Jun 19 08:32:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Although the seminal proposal to introduce language modeling in information retrieval was based on a multivariate Bernoulli model, the predominant modeling approach is now centered on multinomial models. Language modeling for retrieval based on multivariate Bernoulli distributions is seen inefficient and believed less effective than the multinomial model. In this article, we examine the multivariate Bernoulli model with respect to its successor and examine its role in future retrieval systems. In the context of Bayesian learning, these two modeling approaches are described, contrasted, and compared both theoretically and computationally. We show that the query likelihood following a multivariate Bernoulli distribution introduces interesting retrieval features which may be useful for specific retrieval tasks such as sentence retrieval. Then, we address the efficiency aspect and show that algorithms can be designed to perform retrieval efficiently for multivariate Bernoulli models, before performing an empirical comparison to study the behaviorial aspects of the models. A series of comparisons is then conducted on a number of test collections and retrieval tasks to determine the empirical and practical differences between the different models. Our results indicate that for sentence retrieval the multivariate Bernoulli model can significantly outperform the multinomial model. However, for the other tasks the multinomial model provides consistently better performance (and in most cases significantly so). An analysis of the various retrieval characteristics reveals that the multivariate Bernoulli model tends to promote long documents whose nonquery terms are informative. While this is detrimental to the task of document retrieval (documents tend to contain considerable nonquery content), it is valuable for other tasks such as sentence retrieval, where the retrieved elements are very short and focused.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Information retrieval; language models; multinomial; multivariate Bernoulli", } @Article{Barreau:2008:IKR, author = "Deborah Barreau and Robert Capra and Susan Dumais and William Jones and Manuel P{\'e}rez-Qui{\~n}ones", title = "Introduction to keeping, refinding and sharing personal information", journal = j-TOIS, volume = "26", number = "4", pages = "18:1--18:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402257", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Teevan:2008:HPR, author = "Jaime Teevan", title = "How people recall, recognize, and reuse search results", journal = j-TOIS, volume = "26", number = "4", pages = "19:1--19:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402258", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "When a person issues a query, that person has expectations about the search results that will be returned. These expectations can be based on the current information need, but are also influenced by how the searcher believes the search engine works, where relevant results are expected to be ranked, and any previous searches the individual has run on the topic. This paper looks in depth at how the expectations people develop about search result lists during an initial query affect their perceptions of and interactions with future repeat search result lists. Three studies are presented that give insight into how people recall, recognize, and reuse results. The first study (a study of {\em recall\/}) explores what people recall about previously viewed search result lists. The second study (a study of {\em recognition\/}) builds on the first to reveal that people often recognize a result list as one they have seen before even when it is quite different. As long as those aspects that the searcher remembers about the initial list remain the same, other aspects can change significantly. This is advantageous because, as the third study (a study of {\em reuse\/}) shows, when a result list appears to have changed, people have trouble re-using the previously viewed content in the list. They are less likely to find what they are looking for, less happy with the result quality, more likely to find the task hard, and more likely to take a long time searching. Although apparent consistency is important for reuse, people's inability to recognize change makes consistency without stagnation possible. New relevant results can be presented where old results have been forgotten, making both old and new content easy to find.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "dynamic information; personal information management; recall; recognition; Refinding; reuse; search", } @Article{Bergman:2008:ISE, author = "Ofer Bergman and Ruth Beyth-Marom and Rafi Nachmias and Noa Gradovitch and Steve Whittaker", title = "Improved search engines and navigation preference in personal information management", journal = j-TOIS, volume = "26", number = "4", pages = "20:1--20:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402259", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Traditionally users access their personal files mainly by using folder navigation. We evaluate whether recent improvements in desktop search have changed this fundamental aspect of Personal Information Management (PIM). We tested this in two studies using the same questionnaire: (a) The Windows Study --- a longitudinal comparison of {\em Google Desktop\/} and {\em Windows XP Search Companion}, and (b) The Mac Study --- a large scale comparison of Mac {\em Spotlight\/} and {\em Sherlock}. There were few effects for improved search. First, regardless of search engine, there was a strong navigation preference: on average, users estimated that they used navigation for 56--68\% of file retrieval events but searched for only 4--15\% of events. Second, the effect of improving the quality of the search engine on search usage was limited and inconsistent. Third, search was used mainly as a last resort when users could not remember file location. Finally, there was no evidence that using improved desktop search engines leads people to change their filing habits to become less reliant on hierarchical file organization. We conclude by offering theoretical explanations for navigation preference, relating to differences between PIM and Internet retrieval, and suggest alternative design directions for PIM systems.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "files retrieval; navigation preference; Personal information management; personal search engines; search preference; user study", } @Article{Elsweiler:2008:EME, author = "David Elsweiler and Mark Baillie and Ian Ruthven", title = "Exploring memory in email refinding", journal = j-TOIS, volume = "26", number = "4", pages = "21:1--21:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402260", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Human memory plays an important role in personal information management (PIM). Several scholars have noted that people refind information based on what they remember and it has been shown that people adapt their management strategies to compensate for the limitations of memory. Nevertheless, little is known about what people tend to remember about their personal information and how they use their memories to refind. The aim of this article is to increase our understanding of the role that memory plays in the process of refinding personal information. Concentrating on email re-finding, we report on a user study that investigates what attributes of email messages participants remember when trying to refind. We look at how the attributes change in different scenarios and examine the factors which impact on what is remembered.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Email refinding; information refinding; memory; user study", } @Article{Siersdorfer:2008:MMM, author = "Stefan Siersdorfer and Sergej Sizov", title = "Meta methods for model sharing in personal information systems", journal = j-TOIS, volume = "26", number = "4", pages = "22:1--22:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402261", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article introduces a methodology for automatically organizing document collections into thematic categories for Personal Information Management (PIM) through collaborative sharing of machine learning models in an efficient and privacy-preserving way. Our objective is to combine multiple independently learned models from several users to construct an advanced ensemble-based decision model by taking the knowledge of multiple users into account in a decentralized manner, for example, in a peer-to-peer overlay network. High accuracy of the corresponding supervised (classification) and unsupervised (clustering) methods is achieved by restrictively leaving out uncertain documents rather than assigning them to inappropriate topics or clusters with low confidence. We introduce a formal probabilistic model for the resulting ensemble based meta methods and explain how it can be used for constructing estimators and for goal-oriented tuning. Comprehensive evaluation results on different reference data sets illustrate the viability of our approach.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Classification; clustering; meta methods; peer-to-peer; personal information management; restrictive methods", } @Article{Hicks:2008:OMP, author = "B. J. Hicks and A. Dong and R. Palmer and H. C. Mcalpine", title = "Organizing and managing personal electronic files: a mechanical engineer's perspective", journal = j-TOIS, volume = "26", number = "4", pages = "23:1--23:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402262", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article deals with the organization and management of the computer files handled by mechanical engineers on their personal computers. In engineering organizations, a wide variety of electronic files (documents) are necessary to support both business processes and the activities of design and manufacture. Whilst a large number of files and hence information is formally archived, a significant amount of additional information and knowledge resides in electronic files on personal computers. The widespread use of these personal information stores means that all information is retained. However, its reuse is problematic for all but the individual as a result of the naming and organization of the files. To begin to address this issue, a study of the use and current practices for managing personal electronic files is described. The study considers the fundamental classes of files handled by engineers and analyses the organization of these files across the personal computers of 40 participants. The study involves a questionnaire and an electronic audit. The results of these qualitative and quantitative elements are used to elicit an understanding of the practices and requirements of engineers for managing personal electronic files. A potential scheme for naming and organizing personal electronic files is discussed as one possible way to satisfy these requirements. The aim of the scheme is to balance the personal nature of data storage with the need for personal records to be shared with others to support knowledge reuse in engineering organizations. Although this article is concerned with mechanical engineers, the issues dealt with are relevant to knowledge-based industries and, in particular, teams of knowledge workers.", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "directory and file naming conventions; Engineers; file sharing and file recognition and recall; information management", } @Article{Bernstein:2008:ISH, author = "Michael Bernstein and Max {Van Kleek} and David Karger and M. C. Schraefel", title = "Information scraps: {How} and why information eludes our personal information management tools", journal = j-TOIS, volume = "26", number = "4", pages = "24:1--24:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402263", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In this article we investigate {\em information scraps\/} --- personal information where content has been scribbled on Post-it notes, scrawled on the corners of sheets of paper, stuck in our pockets, sent in email messages to ourselves, and stashed in miscellaneous digital text files. Information scraps encode information ranging from ideas and sketches to notes, reminders, shipment tracking numbers, driving directions, and even poetry. Although information scraps are ubiquitous, we have much still to learn about these loose forms of information practice. Why do we keep information scraps outside of our traditional PIM applications? What role do information scraps play in our overall information practice? How might PIM applications be better designed to accommodate and support information scraps' creation, manipulation and retrieval?\par We pursued these questions by studying the information scrap practices of 27 knowledge workers at five organizations. Our observations shed light on information scraps' content, form, media, and location. From this data, we elaborate on the typical information scrap lifecycle, and identify common roles that information scraps play: temporary storage, archiving, work-in-progress, reminding, and management of unusual data. These roles suggest a set of unmet design needs in current PIM tools: lightweight entry, unconstrained content, flexible use and adaptability, visibility, and mobility.", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "information scraps; note taking; Personal information management", } @Article{Marchionini:2008:ERM, author = "Gary Marchionini", title = "Editorial: {Reviewer} merits and review control in an age of electronic manuscript management systems", journal = j-TOIS, volume = "26", number = "4", pages = "25:1--25:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402264", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Peer review is an important resource of scholarly communities and must be managed and nurtured carefully. Electronic manuscript management systems have begun to improve some aspects of workflow for conferences and journals but also raise issues related to reviewer roles and reputations and the control of reviews over time. Professional societies should make their policies related to reviews and reviewer histories clear to authors and reviewers, develop strategies and tools to facilitate good and timely reviews, and facilitate the training of new reviewers.", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "manuscript management systems; Peer review", } @Article{Marchionini:2008:TRJ, author = "Gary Marchionini", title = "{TOIS} reviewers {June 2007} through {May 2008}", journal = j-TOIS, volume = "26", number = "4", pages = "26:1--26:??", month = sep, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1402256.1402265", ISSN = "1046-8188", bibdate = "Mon Oct 6 15:21:17 MDT 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Piwowarski:2008:SCR, author = "Benjamin Piwowarski and Andrew Trotman and Mounia Lalmas", title = "Sound and complete relevance assessment for {XML} retrieval", journal = j-TOIS, volume = "27", number = "1", pages = "1:1--1:??", month = dec, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1416950.1416951", ISSN = "1046-8188", bibdate = "Tue Dec 23 13:49:17 MST 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In information retrieval research, comparing retrieval approaches requires test collections consisting of documents, user requests and relevance assessments. Obtaining relevance assessments that are as sound and complete as possible is crucial for the comparison of retrieval approaches. In XML retrieval, the problem of obtaining sound and complete relevance assessments is further complicated by the structural relationships between retrieval results.\par A major difference between XML retrieval and flat document retrieval is that the relevance of elements (the retrievable units) is not independent of that of related elements. This has major consequences for the gathering of relevance assessments. This article describes investigations into the creation of sound and complete relevance assessments for the evaluation of content-oriented XML retrieval as carried out at INEX, the evaluation campaign for XML retrieval. The campaign, now in its seventh year, has had three substantially different approaches to gather assessments and has finally settled on a highlighting method for marking relevant passages within documents --- even though the objective is to collect assessments at element level. The different methods of gathering assessments at INEX are discussed and contrasted. The highlighting method is shown to be the most reliable of the methods.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "evaluation; INEX; passage retrieval; relevance assessment; XML; XML retrieval", } @Article{Moffat:2008:RBP, author = "Alistair Moffat and Justin Zobel", title = "Rank-biased precision for measurement of retrieval effectiveness", journal = j-TOIS, volume = "27", number = "1", pages = "2:1--2:??", month = dec, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1416950.1416952", ISSN = "1046-8188", bibdate = "Tue Dec 23 13:49:17 MST 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A range of methods for measuring the effectiveness of information retrieval systems has been proposed. These are typically intended to provide a quantitative single-value summary of a document ranking relative to a query. However, many of these measures have failings. For example, recall is not well founded as a measure of satisfaction, since the user of an actual system cannot judge recall. Average precision is derived from recall, and suffers from the same problem. In addition, average precision lacks key stability properties that are needed for robust experiments. In this article, we introduce a new effectiveness metric, {\em rank-biased precision}, that avoids these problems. Rank-biased precision is derived from a simple model of user behavior, is robust if answer rankings are extended to greater depths, and allows accurate quantification of experimental uncertainty, even when only partial relevance judgments are available.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "average precision; pooling; precision; Recall; relevance", } @Article{Zheleva:2008:TSR, author = "Elena Zheleva and Aleksander Kolcz and Lise Getoor", title = "Trusting spam reporters: a reporter-based reputation system for email filtering", journal = j-TOIS, volume = "27", number = "1", pages = "3:1--3:??", month = dec, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1416950.1416953", ISSN = "1046-8188", bibdate = "Tue Dec 23 13:49:17 MST 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Spam is a growing problem; it interferes with valid email and burdens both email users and service providers. In this work, we propose a reactive spam-filtering system based on reporter reputation for use in conjunction with existing spam-filtering techniques. The system has a trust-maintenance component for users, based on their spam-reporting behavior. The challenge that we consider is that of maintaining a reliable system, not vulnerable to malicious users, that will provide early spam-campaign detection to reduce the costs incurred by users and systems. We report on the utility of a reputation system for spam filtering that makes use of the feedback of trustworthy users. We evaluate our proposed framework, using actual complaint feedback from a large population of users, and validate its spam-filtering performance on a collection of real email traffic over several weeks. To test the broader implication of the system, we create a model of the behavior of malicious reporters, and we simulate the system under various assumptions using a synthetic dataset.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "reputation systems; Spam filtering; trust", } @Article{Yeh:2008:EPH, author = "Jui-Feng Yeh and Chung-Hsien Wu and Liang-Chih Yu and Yu-Sheng Lai", title = "Extended probabilistic {HAL} with close temporal association for psychiatric query document retrieval", journal = j-TOIS, volume = "27", number = "1", pages = "4:1--4:??", month = dec, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1416950.1416954", ISSN = "1046-8188", bibdate = "Tue Dec 23 13:49:17 MST 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Psychiatric query document retrieval can assist individuals to locate query documents relevant to their depression-related problems efficiently and effectively. By referring to relevant documents, individuals can understand how to alleviate their depression-related symptoms according to recommendations from health professionals. This work presents an extended probabilistic {\em Hyperspace Analog to Language\/} ({\em epHAL\/}) model to achieve this aim. The epHAL incorporates the close temporal associations between words in query documents to represent word cooccurrence relationships in a high-dimensional context space. The information flow mechanism further combines the query words in the epHAL space to infer related words for effective information retrieval. The language model perplexity is considered as the criterion for model optimization. Finally, the epHAL is adopted for psychiatric query document retrieval, and indicates its superiority in information retrieval over traditional approaches.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Hyperspace Analog to Language (HAL) model; information flow; Information retrieval; query documents", } @Article{Kerne:2008:CMI, author = "Andruid Kerne and Eunyee Koh and Steven M. Smith and Andrew Webb and Blake Dworaczyk", title = "{combinFormation}: Mixed-initiative composition of image and text surrogates promotes information discovery", journal = j-TOIS, volume = "27", number = "1", pages = "5:1--5:??", month = dec, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1416950.1416955", ISSN = "1046-8188", bibdate = "Tue Dec 23 13:49:17 MST 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "combinFormation is a mixed-initiative creativity support tool for searching, browsing, organizing, and integrating information. Images and text are connected to represent surrogates (enhanced bookmarks), optimizing the use of human cognitive facilities. Composition, an alternative to lists and spatial hypertext, is used to represent a collection of surrogates as a connected whole, using principles from art and design. This facilitates the creative process of {\em information discovery}, in which humans develop new ideas while finding and collecting information. To provoke the user to think about the large space of potentially relevant information resources, a generative agent proactively engages in collecting information resources, forming image and text surrogates, and composing them visually. The agent develops the collection and its visual representation over time, enabling the user to see ideas and relationships. To keep the human in control, we develop interactive mechanisms for authoring the composition and directing the agent. In a field study in an interdisciplinary course on The Design Process, over a hundred students alternated using combinFormation and Google+Word to collect prior work on information discovery invention assignments. The students that used combinFormation's mixed-initiative composition of image and text surrogates performed better.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "clustering; collections; creative cognition; Creativity support tools; exploratory search; field study; focused crawler; information discovery; mixed-initiative systems; relevance feedback; semantics; software agents", } @Article{Lin:2008:TAF, author = "Jimmy Lin and Philip Wu and Eileen Abels", title = "Toward automatic facet analysis and need negotiation: {Lessons} from mediated search", journal = j-TOIS, volume = "27", number = "1", pages = "6:1--6:??", month = dec, year = "2008", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1416950.1416956", ISSN = "1046-8188", bibdate = "Tue Dec 23 13:49:17 MST 2008", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This work explores the hypothesis that interactions between a trained human search intermediary and an information seeker can inform the design of interactive IR systems. We discuss results from a controlled Wizard-of-Oz case study, set in the context of the TREC 2005 HARD track evaluation, in which a trained intermediary executed an integrated search and interaction strategy based on conceptual facet analysis and informed by need negotiation techniques common in reference interviews. Having a human ``in the loop'' yielded large improvements over fully automated systems as measured by standard ranked-retrieval metrics, demonstrating the value of mediated search. We present a detailed analysis of the intermediary's actions to gain a deeper understanding of what worked and why. One contribution is a taxonomy of clarification types informed both by empirical results and existing theories in library and information science. We discuss how these findings can guide the development of future systems. Overall, this work illustrates how studying human information-seeking processes can lead to better information retrieval applications.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "interactive information retrieval; Reference interview", } @Article{Rodriguez:2009:AMG, author = "Marko A. Rodriguez and Johan Bollen and Herbert {Van De Sompel}", title = "Automatic metadata generation using associative networks", journal = j-TOIS, volume = "27", number = "2", pages = "7:1--7:??", month = feb, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1462198.1462199", ISSN = "1046-8188", bibdate = "Thu Mar 5 17:50:07 MST 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In spite of its tremendous value, metadata is generally sparse and incomplete, thereby hampering the effectiveness of digital information services. Many of the existing mechanisms for the automated creation of metadata rely primarily on content analysis which can be costly and inefficient. The automatic metadata generation system proposed in this article leverages resource relationships generated from existing metadata as a medium for propagation from metadata-rich to metadata-poor resources. Because of its independence from content analysis, it can be applied to a wide variety of resource media types and is shown to be computationally inexpensive. The proposed method operates through two distinct phases. Occurrence and cooccurrence algorithms first generate an associative network of repository resources leveraging existing repository metadata. Second, using the associative network as a substrate, metadata associated with metadata-rich resources is propagated to metadata-poor resources by means of a discrete-form spreading activation algorithm. This article discusses the general framework for building associative networks, an algorithm for disseminating metadata through such networks, and the results of an experiment and validation of the proposed method using a standard bibliographic dataset.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Associative networks; metadata generation; particle-swarms", } @Article{Park:2009:ALS, author = "Laurence A. F. Park and Kotagiri Ramamohanarao", title = "An analysis of latent semantic term self-correlation", journal = j-TOIS, volume = "27", number = "2", pages = "8:1--8:??", month = feb, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1462198.1462200", ISSN = "1046-8188", bibdate = "Thu Mar 5 17:50:07 MST 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Latent semantic analysis (LSA) is a generalized vector space method that uses dimension reduction to generate term correlations for use during the information retrieval process. We hypothesized that even though the dimension reduction establishes correlations between terms, the dimension reduction is causing a degradation in the correlation of a term to itself (self-correlation). In this article, we have proven that there is a direct relationship to the size of the LSA dimension reduction and the LSA self-correlation. We have also shown that by altering the LSA term self-correlations we gain a substantial increase in precision, while also reducing the computation required during the information retrieval process.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Latent semantic analysis; term correlation", } @Article{Chen:2009:ATF, author = "Chien Chin Chen and Meng Chang Chen and Ming-Syan Chen", title = "An adaptive threshold framework for event detection using {HMM}-based life profiles", journal = j-TOIS, volume = "27", number = "2", pages = "9:1--9:??", month = feb, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1462198.1462201", ISSN = "1046-8188", bibdate = "Thu Mar 5 17:50:07 MST 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "When an event occurs, it attracts attention of information sources to publish related documents along its lifespan. The task of event detection is to automatically identify events and their related documents from a document stream, which is a set of chronologically ordered documents collected from various information sources. Generally, each event has a distinct activeness development so that its status changes continuously during its lifespan. When an event is active, there are a lot of related documents from various information sources. In contrast when it is inactive, there are very few documents, but they are focused. Previous works on event detection did not consider the characteristics of the event's activeness, and used rigid thresholds for event detection. We propose a concept called life profile, modeled by a hidden Markov model, to model the activeness trends of events. In addition, a general event detection framework, LIPED, which utilizes the learned life profiles and the burst-and-diverse characteristic to adjust the event detection thresholds adaptively, can be incorporated into existing event detection methods. Based on the official TDT corpus and contest rules, the evaluation results show that existing detection methods that incorporate LIPED achieve better performance in the cost and F1 metrics, than without.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "clustering; Event detection; hidden Markov models; life profiles; TDT; topic detection", } @Article{Tryfonopoulos:2009:IFQ, author = "Christos Tryfonopoulos and Manolis Koubarakis and Yannis Drougas", title = "Information filtering and query indexing for an information retrieval model", journal = j-TOIS, volume = "27", number = "2", pages = "10:1--10:??", month = feb, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1462198.1462202", ISSN = "1046-8188", bibdate = "Thu Mar 5 17:50:07 MST 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In the information filtering paradigm, clients subscribe to a server with continuous queries or profiles that express their information needs. Clients can also publish documents to servers. Whenever a document is published, the continuous queries satisfying this document are found and notifications are sent to appropriate clients. This article deals with the filtering problem that needs to be solved efficiently by each server: Given a database of continuous queries {\em db\/} and a document $d$, find all queries $q \in {\em db\/}$ that match $d$. We present data structures and indexing algorithms that enable us to solve the filtering problem efficiently for large databases of queries expressed in the model {\em AWP}. {\em AWP\/} is based on named attributes with values of type text, and its query language includes Boolean and word proximity operators.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Information filtering; performance evaluation; query indexing algorithms; selective dissemination of information", } @Article{Xue:2009:ULM, author = "Gui-Rong Xue and Jie Han and Yong Yu and Qiang Yang", title = "User language model for collaborative personalized search", journal = j-TOIS, volume = "27", number = "2", pages = "11:1--11:??", month = feb, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1462198.1462203", ISSN = "1046-8188", bibdate = "Thu Mar 5 17:50:07 MST 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Traditional personalized search approaches rely solely on individual profiles to construct a user model. They are often confronted by two major problems: data sparseness and cold-start for new individuals. Data sparseness refers to the fact that most users only visit a small portion of Web pages and hence a very sparse user-term relationship matrix is generated, while cold-start for new individuals means that the system cannot conduct any personalization without previous browsing history. Recently, community-based approaches were proposed to use the group's social behaviors as a supplement to personalization. However, these approaches only consider the commonality of a group of users and still cannot satisfy the diverse information needs of different users. In this article, we present a new approach, called collaborative personalized search. It considers not only the commonality factor among users for defining group user profiles and global user profiles, but also the specialties of individuals. Then, a statistical user language model is proposed to integrate the individual model, group user model and global user model together. In this way, the probability that a user will like a Web page is calculated through a two-step smoothing mechanism. First, a global user model is used to smooth the probability of unseen terms in the individual profiles and provide aggregated behavior of global users. Then, in order to precisely describe individual interests by looking at the behaviors of similar users, users are clustered into groups and group-user models are constructed. The group-user models are integrated into an overall model through a cluster-based language model. The behaviors of the group users can be utilized to enhance the performance of personalized search. This model can alleviate the two aforementioned problems and provide a more effective personalized search than previous approaches. Large-scale experimental evaluations are conducted to show that the proposed approach substantially improves the relevance of a search over several competitive methods.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "clustering; cold-start; Collaborative personalized search; data Sparseness; smoothing; user language model", } @Article{Schumaker:2009:TAS, author = "Robert P. Schumaker and Hsinchun Chen", title = "Textual analysis of stock market prediction using breaking financial news: {The} {AZFin} text system", journal = j-TOIS, volume = "27", number = "2", pages = "12:1--12:??", month = feb, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1462198.1462204", ISSN = "1046-8188", bibdate = "Thu Mar 5 17:50:07 MST 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Our research examines a predictive machine learning approach for financial news articles analysis using several different textual representations: bag of words, noun phrases, and named entities. Through this approach, we investigated 9,211 financial news articles and 10,259,042 stock quotes covering the S\&P 500 stocks during a five week period. We applied our analysis to estimate a discrete stock price twenty minutes after a news article was released. Using a support vector machine (SVM) derivative specially tailored for discrete numeric prediction and models containing different stock-specific variables, we show that the model containing both article terms and stock price at the time of article release had the best performance in closeness to the actual future stock price (MSE 0.04261), the same direction of price movement as the future price (57.1\% directional accuracy) and the highest return using a simulated trading engine (2.06\% return). We further investigated the different textual representations and found that a Proper Noun scheme performs better than the de facto standard of Bag of Words in all three metrics.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "prediction; stock market; SVM", } @Article{Kurland:2009:CLM, author = "Oren Kurland and Lillian Lee", title = "Clusters, language models, and ad hoc information retrieval", journal = j-TOIS, volume = "27", number = "3", pages = "13:1--13:??", month = may, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1508850.1508851", ISSN = "1046-8188", bibdate = "Wed May 20 13:44:20 MDT 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The language-modeling approach to information retrieval provides an effective statistical framework for tackling various problems and often achieves impressive empirical performance. However, most previous work on language models for information retrieval focused on document-specific characteristics, and therefore did not take into account the structure of the surrounding corpus, a potentially rich source of additional information. We propose a novel algorithmic framework in which information provided by document-based language models is enhanced by the incorporation of information drawn from {\em clusters\/} of similar documents. Using this framework, we develop a suite of new algorithms. Even the simplest typically outperforms the standard language-modeling approach in terms of mean average precision (MAP) and recall, and our new {\em interpolation\/} algorithm posts statistically significant performance improvements for both metrics over all six corpora tested. An important aspect of our work is the way we model corpus structure. In contrast to most previous work on cluster-based retrieval that partitions the corpus, we demonstrate the effectiveness of a simple strategy based on a nearest-neighbors approach that produces overlapping clusters.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "aspect models; cluster hypothesis; cluster-based language models; clustering; interpolation model; Language modeling; smoothing", } @Article{Shokouhi:2009:RRM, author = "Milad Shokouhi and Justin Zobel", title = "Robust result merging using sample-based score estimates", journal = j-TOIS, volume = "27", number = "3", pages = "14:1--14:??", month = may, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1508850.1508852", ISSN = "1046-8188", bibdate = "Wed May 20 13:44:20 MDT 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In federated information retrieval, a query is routed to multiple collections and a single answer list is constructed by combining the results. Such metasearch provides a mechanism for locating documents on the hidden Web and, by use of sampling, can proceed even when the collections are uncooperative. However, the similarity scores for documents returned from different collections are not comparable, and, in uncooperative environments, document scores are unlikely to be reported. We introduce a new merging method for uncooperative environments, in which similarity scores for the sampled documents held for each collection are used to estimate global scores for the documents returned per query. This method requires no assumptions about properties such as the retrieval models used. Using experiments on a wide range of collections, we show that in many cases our merging methods are significantly more effective than previous techniques.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "distributed information retrieval; result fusion; Result merging; uncooperative collections", } @Article{Candan:2009:SSE, author = "K. Sel{\c{c}}uk Candan and Mehmet E. D{\"o}nderler and Terri Hedgpeth and Jong Wook Kim and Qing Li and Maria Luisa Sapino", title = "{SEA}: {Segment-enrich-annotate} paradigm for adapting dialog-based content for improved accessibility", journal = j-TOIS, volume = "27", number = "3", pages = "15:1--15:??", month = may, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1508850.1508853", ISSN = "1046-8188", bibdate = "Wed May 20 13:44:20 MDT 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "While navigation within complex information spaces is a problem for all users, the problem is most evident with individuals who are blind who cannot simply locate, point, and click on a link in hypertext documents with a mouse. Users who are blind have to listen searching for the link in the document using only the keyboard and a screen reader program, which may be particularly inefficient in large documents with many links or deep hierarchies that are hard to navigate. Consequently, they are especially penalized when the information being searched is hidden under multiple layers of indirections. In this article, we introduce a {\em segment-enrich-annotate\/} (SEA) paradigm for adapting digital content with deep structures for improved accessibility. In particular, we instantiate and evaluate this paradigm through the iCare-Assistant, an assistive system for helping students who are blind in accessing Web and electronic course materials. Our evaluations, involving the participation of students who are blind, showed that the iCare-Assistant system, built based on the SEA paradigm, reduces the navigational overhead significantly and enables user who are blind access complex online course servers effectively.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "annotation; assistive technology for blind users; educational discussion boards and Web sites; segmentation; Web navigational aids", } @Article{Hoi:2009:SSB, author = "Steven C. H. Hoi and Rong Jin and Jianke Zhu and Michael R. Lyu", title = "Semisupervised {SVM} batch mode active learning with applications to image retrieval", journal = j-TOIS, volume = "27", number = "3", pages = "16:1--16:??", month = may, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1508850.1508854", ISSN = "1046-8188", bibdate = "Wed May 20 13:44:20 MDT 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Support vector machine (SVM) active learning is one popular and successful technique for relevance feedback in content-based image retrieval (CBIR). Despite the success, conventional SVM active learning has two main drawbacks. First, the performance of SVM is usually limited by the number of labeled examples. It often suffers a poor performance for the small-sized labeled examples, which is the case in relevance feedback. Second, conventional approaches do not take into account the redundancy among examples, and could select multiple examples that are similar (or even identical). In this work, we propose a novel scheme for explicitly addressing the drawbacks. It first learns a kernel function from a mixture of labeled and unlabeled data, and therefore alleviates the problem of small-sized training data. The kernel will then be used for a batch mode active learning method to identify the most informative and diverse examples via a min-max framework. Two novel algorithms are proposed to solve the related combinatorial optimization: the first approach approximates the problem into a quadratic program, and the second solves the combinatorial optimization approximately by a greedy algorithm that exploits the merits of submodular functions. Extensive experiments with image retrieval using both natural photo images and medical images show that the proposed algorithms are significantly more effective than the state-of-the-art approaches. A demo is available at http://msm.cais.ntu.edu.sg/LSCBIR/.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "active learning; batch mode active learning; Content-based image retrieval; human-computer interaction; semisupervised learning; support vector machines", } @Article{Huang:2009:BCS, author = "Zi Huang and Heng Tao Shen and Jie Shao and Xiaofang Zhou and Bin Cui", title = "Bounded coordinate system indexing for real-time video clip search", journal = j-TOIS, volume = "27", number = "3", pages = "17:1--17:??", month = may, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1508850.1508855", ISSN = "1046-8188", bibdate = "Wed May 20 13:44:20 MDT 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, video clips have become very popular online. The massive influx of video clips has created an urgent need for video search engines to facilitate retrieving relevant clips. Different from traditional long videos, a video clip is a short video often expressing a moment of significance. Due to the high complexity of video data, efficient video clip search from large databases turns out to be very challenging. We propose a novel video clip representation model called the {\em Bounded Coordinate System\/} (BCS), which is the first single representative capturing the dominating content and content --- changing trends of a video clip. It summarizes a video clip by a coordinate system, where each of its coordinate axes is identified by principal component analysis (PCA) and bounded by the range of data projections along the axis. The similarity measure of BCS considers the operations of translation, rotation, and scaling for coordinate system matching. Particularly, rotation and scaling reflect the difference of content tendencies. Compared with the quadratic time complexity of existing methods, the time complexity of measuring BCS similarity is linear. The compact video representation together with its linear similarity measure makes real-time search from video clip collections feasible. To further improve the retrieval efficiency for large video databases, a two-dimensional transformation method called {\em Bidistance Transformation\/} (BDT) is introduced to utilize a pair of optimal reference points with respect to bidirectional axes in BCS. Our extensive performance study on a large database of more than 30,000 video clips demonstrates that BCS achieves very high search accuracy according to human judgment. This indicates that content tendencies are important in determining the meanings of video clips and confirms that BCS can capture the inherent moment of video clip to some extent that better resembles human perception. In addition, BDT outperforms existing indexing methods greatly. Integration of the BCS model and BDT indexing can achieve real-time search from large video clip databases.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "indexing; query processing; summarization; Video search", } @Article{Shen:2009:NFE, author = "Jialie Shen and John Shepherd and Bin Cui and Kian-Lee Tan", title = "A novel framework for efficient automated singer identification in large music databases", journal = j-TOIS, volume = "27", number = "3", pages = "18:1--18:??", month = may, year = "2009", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1508850.1508856", ISSN = "1046-8188", bibdate = "Wed May 20 13:44:20 MDT 2009", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Over the past decade, there has been explosive growth in the availability of multimedia data, particularly image, video, and music. Because of this, content-based music retrieval has attracted attention from the multimedia database and information retrieval communities. Content-based music retrieval requires us to be able to automatically identify particular characteristics of music data. One such characteristic, useful in a range of applications, is the identification of the singer in a musical piece. Unfortunately, existing approaches to this problem suffer from either low accuracy or poor scalability. In this article, we propose a novel scheme, called {\em Hybrid Singer Identifier\/} (HSI), for efficient automated singer recognition. HSI uses multiple low-level features extracted from both vocal and nonvocal music segments to enhance the identification process; it achieves this via a hybrid architecture that builds profiles of individual singer characteristics based on statistical mixture models. An extensive experimental study on a large music database demonstrates the superiority of our method over state-of-the-art approaches in terms of effectiveness, efficiency, scalability, and robustness.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "classification; EM algorithm; evaluation; Gaussian mixture models; Music retrieval; singer identification; statistical modeling", } @Article{Boldi:2009:PFD, author = "Paolo Boldi and Massimo Santini and Sebastiano Vigna", title = "{PageRank}: {Functional} dependencies", journal = j-TOIS, volume = "27", number = "4", pages = "19:1--19:??", month = nov, year = "2009", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:02 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Dang:2009:BFP, author = "Edward Kai Fung Dang and Ho Chung Wu and Robert Wing Pong Luk and Kam Fai Wong", title = "Building a framework for the probability ranking principle by a family of expected weighted rank", journal = j-TOIS, volume = "27", number = "4", pages = "20:1--20:??", month = nov, year = "2009", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:02 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Guiver:2009:FGT, author = "John Guiver and Stefano Mizzaro and Stephen Robertson", title = "A few good topics: {Experiments} in topic set reduction for retrieval evaluation", journal = j-TOIS, volume = "27", number = "4", pages = "21:1--21:??", month = nov, year = "2009", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:02 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Dupplaw:2009:DSB, author = "David Dupplaw and Srinandan Dasmahapatra and Bo Hu and Paul Lewis and Nigel Shadbolt", title = "A distributed, service-based framework for knowledge applications with multimedia", journal = j-TOIS, volume = "27", number = "4", pages = "22:1--22:??", month = nov, year = "2009", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:02 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{White:2009:CSE, author = "Ryen W. White and Eric Horvitz", title = "Cyberchondria: {Studies} of the escalation of medical concerns in {Web} search", journal = j-TOIS, volume = "27", number = "4", pages = "23:1--23:??", month = nov, year = "2009", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:02 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Rosaci:2009:MDR, author = "Domenico Rosaci and Giuseppe M. L. Sarn{\'e} and Salvatore Garruzzo", title = "{MUADDIB}: a distributed recommender system supporting device adaptivity", journal = j-TOIS, volume = "27", number = "4", pages = "24:1--24:??", month = nov, year = "2009", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:02 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Blanco:2010:PSP, author = "Roi Blanco and Alvaro Barreiro", title = "Probabilistic static pruning of inverted files", journal = j-TOIS, volume = "28", number = "1", pages = "1:1--1:??", month = jan, year = "2010", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:04 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chia:2010:SLB, author = "Tee Kiah Chia and Khe Chai Sim and Haizhou Li and Hwee Tou Ng", title = "Statistical lattice-based spoken document retrieval", journal = j-TOIS, volume = "28", number = "1", pages = "2:1--2:??", month = jan, year = "2010", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:04 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tagarelli:2010:SCX, author = "Andrea Tagarelli and Sergio Greco", title = "Semantic clustering of {XML} documents", journal = j-TOIS, volume = "28", number = "1", pages = "3:1--3:??", month = jan, year = "2010", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:04 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Rosen-Zvi:2010:LAT, author = "Michal Rosen-Zvi and Chaitanya Chemudugunta and Thomas Griffiths and Padhraic Smyth and Mark Steyvers", title = "Learning author-topic models from text corpora", journal = j-TOIS, volume = "28", number = "1", pages = "4:1--4:??", month = jan, year = "2010", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Mon Mar 15 12:37:04 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Puppin:2010:TCS, author = "Diego Puppin and Fabrizio Silvestri and Raffaele Perego and Ricardo Baeza-Yates", title = "Tuning the capacity of search engines: {Load-driven} routing and incremental caching to reduce and balance the load", journal = j-TOIS, volume = "28", number = "2", pages = "5:1--5:??", month = may, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1740592.1740593", ISSN = "1046-8188", bibdate = "Mon Jun 21 17:30:54 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article introduces an architecture for a document-partitioned search engine, based on a novel approach combining collection selection and load balancing, called {\em load-driven routing}. By exploiting the query-vector document model, and the incremental caching technique, our architecture can compute very high quality results for any query, with only a fraction of the computational load used in a typical document-partitioned architecture. By trading off a small fraction of the results, our technique allows us to strongly reduce the computing pressure to a search engine back-end; we are able to retrieve more than 2/3 of the top-5 results for a given query with only 10\% the computing load needed by a configuration where the query is processed by each index partition. Alternatively, we can slightly increase the load up to 25\% to improve precision and get more than 80\% of the top-5 results. In fact, the flexibility of our system allows a wide range of different configurations, so as to easily respond to different needs in result quality or restrictions in computing power. More important, the system configuration can be adjusted dynamically in order to fit unexpected query peaks or unpredictable failures. This article wraps up some recent works by the authors, showing the results obtained by tests conducted on 6 million documents, 2,800,000 queries and real query cost timing as measured on an actual index.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "collection selection; Distributed IR; incremental caching; Web search engines", } @Article{Gao:2010:EQL, author = "Wei Gao and Cheng Niu and Jian-Yun Nie and Ming Zhou and Kam-Fai Wong and Hsiao-Wuen Hon", title = "Exploiting query logs for cross-lingual query suggestions", journal = j-TOIS, volume = "28", number = "2", pages = "6:1--6:??", month = may, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1740592.1740594", ISSN = "1046-8188", bibdate = "Mon Jun 21 17:30:54 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Query suggestion aims to suggest relevant queries for a given query, which helps users better specify their information needs. Previous work on query suggestion has been limited to the same language. In this article, we extend it to cross-lingual query suggestion (CLQS): for a query in one language, we suggest similar or relevant queries in other languages. This is very important to the scenarios of cross-language information retrieval (CLIR) and other related cross-lingual applications. Instead of relying on existing query translation technologies for CLQS, we present an effective means to map the input query of one language to queries of the other language in the query log. Important monolingual and cross-lingual information such as word translation relations and word co-occurrence statistics, and so on, are used to estimate the cross-lingual query similarity with a discriminative model. Benchmarks show that the resulting CLQS system significantly outperforms a baseline system that uses dictionary-based query translation. Besides, we evaluate CLQS with French-English and Chinese--English CLIR tasks on TREC-6 and NTCIR-4 collections, respectively. The CLIR experiments using typical retrieval models demonstrate that the CLQS-based approach has significantly higher effectiveness than several traditional query translation methods. We find that when combined with pseudo-relevance feedback, the effectiveness of CLIR using CLQS is enhanced for different pairs of languages.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Cross-language information retrieval; query expansion; query log; query suggestion; query translation", } @Article{Kolbe:2010:ENN, author = "Dashiell Kolbe and Qiang Zhu and Sakti Pramanik", title = "Efficient $k$-nearest neighbor searching in nonordered discrete data spaces", journal = j-TOIS, volume = "28", number = "2", pages = "7:1--7:??", month = may, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1740592.1740595", ISSN = "1046-8188", bibdate = "Mon Jun 21 17:30:54 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Numerous techniques have been proposed in the past for supporting efficient {\em k\/} -nearest neighbor ({\em k\/} -NN) queries in continuous data spaces. Limited work has been reported in the literature for {\em k\/} -NN queries in a nonordered discrete data space (NDDS). Performing {\em k\/} -NN queries in an NDDS raises new challenges. The Hamming distance is usually used to measure the distance between two vectors (objects) in an NDDS. Due to the coarse granularity of the Hamming distance, a {\em k\/} -NN query in an NDDS may lead to a high degree of nondeterminism for the query result. We propose a new distance measure, called Granularity-Enhanced Hamming (GEH) distance, which effectively reduces the number of candidate solutions for a query. We have also implemented {\em k\/} -NN queries using multidimensional database indexing in NDDSs. Further, we use the properties of our multidimensional NDDS index to derive the probability of encountering valid neighbors within specific regions of the index. This probability is used to develop a new search ordering heuristic. Our experiments on synthetic and genomic data sets demonstrate that our index-based {\em k\/} -NN algorithm is efficient in finding {\em k\/} -NNs in both uniform and nonuniform data sets in NDDSs and that our heuristics are effective in improving the performance of such queries.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "database; distance measurement; nearest neighbor; nonordered discrete data space; Similarity search; spatial indexing", } @Article{Wan:2010:ENK, author = "Xiaojun Wan and Jianguo Xiao", title = "Exploiting neighborhood knowledge for single document summarization and keyphrase extraction", journal = j-TOIS, volume = "28", number = "2", pages = "8:1--8:??", month = may, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1740592.1740596", ISSN = "1046-8188", bibdate = "Mon Jun 21 17:30:54 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Document summarization and keyphrase extraction are two related tasks in the IR and NLP fields, and both of them aim at extracting condensed representations from a single text document. Existing methods for single document summarization and keyphrase extraction usually make use of only the information contained in the specified document. This article proposes using a small number of nearest neighbor documents to improve document summarization and keyphrase extraction for the specified document, under the assumption that the neighbor documents could provide additional knowledge and more clues. The specified document is expanded to a small document set by adding a few neighbor documents close to the document, and the graph-based ranking algorithm is then applied on the expanded document set to make use of both the local information in the specified document and the global information in the neighbor documents. Experimental results on the Document Understanding Conference (DUC) benchmark datasets demonstrate the effectiveness and robustness of our proposed approaches. The cross-document sentence relationships in the expanded document set are validated to be beneficial to single document summarization, and the word cooccurrence relationships in the neighbor documents are validated to be very helpful to single document keyphrase extraction.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Document summarization; graph-based ranking; keyphrase extraction; neighborhood knowledge", } @Article{Kelly:2010:EPN, author = "Diane Kelly and Xin Fu and Chirag Shah", title = "Effects of position and number of relevant documents retrieved on users' evaluations of system performance", journal = j-TOIS, volume = "28", number = "2", pages = "9:1--9:??", month = may, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1740592.1740597", ISSN = "1046-8188", bibdate = "Mon Jun 21 17:30:54 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information retrieval research has demonstrated that system performance does not always correlate positively with user performance, and that users often assign positive evaluation scores to search systems even when they are unable to complete tasks successfully. This research investigated the relationship between objective measures of system performance and users' perceptions of that performance. In this study, subjects evaluated the performance of four search systems whose search results were manipulated systematically to produce different orderings and numbers of relevant documents. Three laboratory studies were conducted with a total of eighty-one subjects. The first two studies investigated the effect of the order of five relevant and five nonrelevant documents in a search results list containing ten results on subjects' evaluations. The third study investigated the effect of varying the number of relevant documents in a search results list containing ten results on subjects' evaluations. Results demonstrate linear relationships between subjects' evaluations and the position of relevant documents in a search results list and the total number of relevant documents retrieved. Of the two, number of relevant documents retrieved was a stronger predictor of subjects' evaluation ratings and resulted in subjects using a greater range of evaluation scores.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "precision; presentation of search results; ranking; satisfaction; Search performance; user evaluation of performance", } @Article{Brisaboa:2010:DLT, author = "Nieves Brisaboa and Antonio Fari{\~n}a and Gonzalo Navarro and Jos{\'e} Param{\'a}", title = "Dynamic lightweight text compression", journal = j-TOIS, volume = "28", number = "3", pages = "10:1--10:??", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777433", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We address the problem of adaptive compression of natural language text, considering the case where the receiver is much less powerful than the sender, as in mobile applications. Our techniques achieve compression ratios around 32\% and require very little effort from the receiver. Furthermore, the receiver is not only lighter, but it can also search the compressed text with less work than that necessary to decompress it. This is a novelty in two senses: it breaks the usual compressor/decompressor symmetry typical of adaptive schemes, and it contradicts the long-standing assumption that only semistatic codes could be searched more efficiently than the uncompressed text. Our novel compression methods are preferable in several aspects over the existing adaptive and semistatic compressors for natural language texts.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "adaptive natural language text compression; compressed pattern matching; real-time transmission; searching compressed texts; text compression", } @Article{Wu:2010:AVG, author = "Gang Wu and Yimin Wei", title = "{Arnoldi} versus {GMRES} for computing {PageRank}: a theoretical contribution to {Google}'s {PageRank} problem", journal = j-TOIS, volume = "28", number = "3", pages = "11:1--11:28", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777434", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "PageRank is one of the most important ranking techniques used in today's search engines. A recent very interesting research track focuses on exploiting efficient numerical methods to speed up the computation of PageRank, among which the Arnoldi-type algorithm and the GMRES algorithm are competitive candidates. In essence, the former deals with the PageRank problem from an eigenproblem, while the latter from a linear system, point of view. However, there is little known about the relations between the two approaches for PageRank. In this article, we focus on a theoretical and numerical comparison of the two approaches. Numerical experiments illustrate the effectiveness of our theoretical results.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "Arnoldi; GMRES; Google; Krylov subspace; PageRank; Web ranking", } @Article{Li:2010:LCG, author = "Xiao Li and Ye-Yi Wang and Dou Shen and Alex Acero", title = "Learning with click graph for query intent classification", journal = j-TOIS, volume = "28", number = "3", pages = "12:1--12:??", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777435", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Topical query classification, as one step toward understanding users' search intent, is gaining increasing attention in information retrieval. Previous works on this subject primarily focused on enrichment of query features, for example, by augmenting queries with search engine results. In this work, we investigate a completely orthogonal approach --- instead of improving feature representation, we aim at drastically increasing the amount of training data. To this end, we propose two semisupervised learning methods that exploit user click-through data. In one approach, we infer class memberships of unlabeled queries from those of labeled ones according to their proximities in a click graph; and then use these automatically labeled queries to train classifiers using query terms as features. In a second approach, click graph learning and query classifier training are conducted jointly with an integrated objective. Our methods are evaluated in two applications, product intent and job intent classification. In both cases, we expand the training data by over two orders of magnitude, leading to significant improvements in classification performance. An additional finding is that with a large amount of training data obtained in this fashion, a classifier based on simple query term features can outperform those using state-of-the-art, augmented features.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "click graph; query classification; semisupervised learning; user intent", } @Article{Harabagiu:2010:UTT, author = "Sanda Harabagiu and Finley Lacatusu", title = "Using topic themes for multi-document summarization", journal = j-TOIS, volume = "28", number = "3", pages = "13:1--13:??", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777436", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The problem of using topic representations for multidocument summarization (MDS) has received considerable attention recently. Several topic representations have been employed for producing informative and coherent summaries. In this article, we describe five previously known topic representations and introduce two novel representations of topics based on topic themes. We present eight different methods of generating multidocument summaries and evaluate each of these methods on a large set of topics used in past DUC workshops. Our evaluation results show a significant improvement in the quality of summaries based on topic themes over MDS methods that use other alternative topic representations.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "summarization; topic representations; topic themes", } @Article{Maslennikov:2010:CRI, author = "Mstislav Maslennikov and Tat-Seng Chua", title = "Combining relations for information extraction from free text", journal = j-TOIS, volume = "28", number = "3", pages = "14:1--14:??", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777437", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Relations between entities of the same semantic type tend to be sparse in free texts. Therefore, combining relations is the key to effective information extraction (IE) on free text datasets with a small set of training samples. Previous approaches to bootstrapping for IE used different types of relations, such as dependency or co-occurrence, and faced the problems of paraphrasing and misalignment of instances. To cope with these problems, we propose a framework that integrates several types of relations. After extracting candidate entities, our framework evaluates relations between them at the phrasal, dependency, semantic frame, and discourse levels. For each of these levels, we build a classifier that outputs a score for relation instances. In order to integrate these scores, we propose three strategies: (1) integrate evaluation scores from each relation classifier; (2) incorporate the elimination of negatively labeled instances in a previous strategy; and (3) add cascading of extracted relations into strategy (1). Our framework improves the state-of-art results for supervised systems by 8\%, 15\%, 3\%, and 5\% on MUC4 (terrorism); MUC6 (management succession); ACE RDC 2003 (news, general types); and ACE RDC 2003 (news, specific types) domains respectively.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "bootstrapping; dependency relations; discourse relations; information extraction; semantic relations", } @Article{Lauw:2010:SST, author = "Hady W. Lauw and Ee-Peng Lim and Hweehwa Pang and Teck-Tim Tan", title = "{STEvent}: {Spatio-temporal} event model for social network discovery", journal = j-TOIS, volume = "28", number = "3", pages = "15:1--15:??", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777438", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Spatio-temporal data concerning the movement of individuals over space and time contains latent information on the associations among these individuals. Sources of spatio-temporal data include usage logs of mobile and Internet technologies. This article defines a spatio-temporal event by the co-occurrences among individuals that indicate potential associations among them. Each spatio-temporal event is assigned a weight based on the precision and uniqueness of the event. By aggregating the weights of events relating two individuals, we can determine the strength of association between them. We conduct extensive experimentation to investigate both the efficacy of the proposed model as well as the computational complexity of the proposed algorithms. Experimental results on three real-life spatio-temporal datasets cross-validate each other, lending greater confidence on the reliability of our proposed model.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "data mining; social network; spatio-temporal databases", } @Article{Ko:2010:PMA, author = "Jeongwoo Ko and Luo Si and Eric Nyberg and Teruko Mitamura", title = "Probabilistic models for answer-ranking in multilingual question-answering", journal = j-TOIS, volume = "28", number = "3", pages = "16:1--16:??", month = jun, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1777432.1777439", ISSN = "1046-8188", bibdate = "Tue Jul 6 15:53:00 MDT 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article presents two probabilistic models for answering ranking in the multilingual question-answering (QA) task, which finds exact answers to a natural language question written in different languages. Although some probabilistic methods have been utilized in traditional monolingual answer-ranking, limited prior research has been conducted for answer-ranking in multilingual question-answering with formal methods. This article first describes a probabilistic model that predicts the probabilities of correctness for individual answers in an independent way. It then proposes a novel probabilistic method to jointly predict the correctness of answers by considering both the correctness of individual answers as well as their correlations. As far as we know, this is the first probabilistic framework that proposes to model the correctness and correlation of answer candidates in multilingual question-answering and provide a novel approach to design a flexible and extensible system architecture for answer selection in multilingual QA. An extensive set of experiments were conducted to show the effectiveness of the proposed probabilistic methods in English-to-Chinese and English-to-Japanese cross-lingual QA, as well as English, Chinese, and Japanese monolingual QA using TREC and NTCIR questions.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", keywords = "answer selection; answer-merging; answer-ranking; probabilistic graphical model; question-answering", } @Article{Tan:2010:CBI, author = "Qingzhao Tan and Prasenjit Mitra", title = "Clustering-based incremental {Web} crawling", journal = j-TOIS, volume = "28", number = "4", pages = "17:1--17:??", month = nov, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1852102.1852103", ISSN = "1046-8188", bibdate = "Tue Nov 23 10:24:49 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "When crawling resources, for example, number of machines, crawl-time, and so on, are limited, so a crawler has to decide an optimal order in which to crawl and recrawl Web pages. Ideally, crawlers should request only those Web pages that have changed since the last crawl; in practice, a crawler may not know whether a Web page has changed before downloading it. In this article, we identify features of Web pages that are correlated to their change frequency. We design a crawling algorithm that clusters Web pages based on features that correlate to their change frequencies obtained by examining past history.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Kurland:2010:PHS, author = "Oren Kurland and Lillian Lee", title = "{PageRank} without hyperlinks: {Structural} reranking using links induced by language models", journal = j-TOIS, volume = "28", number = "4", pages = "18:1--18:??", month = nov, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1852102.1852104", ISSN = "1046-8188", bibdate = "Tue Nov 23 10:24:49 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The ad hoc retrieval task is to find documents in a corpus that are relevant to a query. Inspired by the PageRank and HITS (hubs and authorities) algorithms for Web search, we propose a structural reranking approach to ad-hoc retrieval that applies to settings with no hyperlink information. We reorder the documents in an initially retrieved set by exploiting implicit asymmetric relationships among them. We consider generation links, which indicate that the language model induced from one document assigns high probability to the text of another. We study a number of reranking criteria based on measures of centrality in the graphs formed by generation links, and show that integrating centrality into standard language-model-based retrieval is quite effective at improving precision at top ranks; the best resultant performance is comparable, and often superior, to that of a state-of-the-art pseudo-feedback-based retrieval approach.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Magalhaes:2010:ITF, author = "Jo{\~a}o Magalh{\~a}es and Stefan R{\"u}ger", title = "An information-theoretic framework for semantic-multimedia retrieval", journal = j-TOIS, volume = "28", number = "4", pages = "19:1--19:??", month = nov, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1852102.1852105", ISSN = "1046-8188", bibdate = "Tue Nov 23 10:24:49 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article is set in the context of searching text and image repositories by keyword. We develop a unified probabilistic framework for text, image, and combined text and image retrieval that is based on the detection of keywords (concepts) using automated image annotation technology. Our framework is deeply rooted in information theory and lends itself to use with other media types. We estimate a statistical model in a multimodal feature space for each possible query keyword. The key element of our framework is to identify feature space transformations that make them comparable in complexity and density. We select the optimal multimodal feature space with a minimum description length criterion from a set of candidate feature spaces that are computed with the average-mutual-information criterion for the text part and hierarchical expectation maximization for the visual part of the data.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Webber:2010:SMI, author = "William Webber and Alistair Moffat and Justin Zobel", title = "A similarity measure for indefinite rankings", journal = j-TOIS, volume = "28", number = "4", pages = "20:1--20:??", month = nov, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1852102.1852106", ISSN = "1046-8188", bibdate = "Tue Nov 23 10:24:49 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Ranked lists are encountered in research and daily life and it is often of interest to compare these lists even when they are incomplete or have only some members in common. An example is document rankings returned for the same query by different search engines. A measure of the similarity between incomplete rankings should handle nonconjointness, weight high ranks more heavily than low, and be monotonic with increasing depth of evaluation; but no measure satisfying all these criteria currently exists. In this article, we propose a new measure having these qualities, namely rank-biased overlap (RBO). The RBO measure is based on a simple probabilistic user model.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Clements:2010:TDE, author = "Maarten Clements and Arjen P. {De Vries} and Marcel J. T. Reinders", title = "The task-dependent effect of tags and ratings on social media access", journal = j-TOIS, volume = "28", number = "4", pages = "21:1--21:??", month = nov, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1852102.1852107", ISSN = "1046-8188", bibdate = "Tue Nov 23 10:24:49 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, online social networks have emerged that allow people to share their multimedia files, retrieve interesting content, and discover like-minded people. These systems often provide the possibility to annotate the content with tags and ratings. Using a random walk through the social annotation graph, we have combined these annotations into a retrieval model that effectively balances the personal preferences and opinions of like-minded users into a single relevance ranking for either content, tags, or people. We use this model to identify the influence of different annotation methods and system design aspects on common ranking tasks in social content systems. Our results show that a combination of rating and tagging information can improve tasks like search and recommendation.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Huang:2010:MND, author = "Zi Huang and Bo Hu and Hong Cheng and Heng Tao Shen and Hongyan Liu and Xiaofang Zhou", title = "Mining near-duplicate graph for cluster-based reranking of {Web} video search results", journal = j-TOIS, volume = "28", number = "4", pages = "22:1--22:??", month = nov, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1852102.1852108", ISSN = "1046-8188", bibdate = "Tue Nov 23 10:24:49 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, video search reranking has been an effective mechanism to improve the initial text-based ranking list by incorporating visual consistency among the result videos. While existing methods attempt to rerank all the individual result videos, they suffer from several drawbacks. In this article, we propose a new video reranking paradigm called cluster-based video reranking (CVR). The idea is to first construct a video near-duplicate graph representing the visual similarity relationship among videos, followed by identifying the near-duplicate clusters from the video near-duplicate graph, then ranking the obtained near-duplicate clusters based on cluster properties and intercluster links, and finally for each ranked cluster, a representative video is selected and returned.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Culpepper:2010:ESI, author = "J. Shane Culpepper and Alistair Moffat", title = "Efficient set intersection for inverted indexing", journal = j-TOIS, volume = "29", number = "1", pages = "1:1--1:??", month = dec, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1877766.1877767", ISSN = "1046-8188", bibdate = "Thu Dec 23 17:15:03 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Conjunctive Boolean queries are a key component of modern information retrieval systems, especially when Web-scale repositories are being searched. A conjunctive query q is equivalent to a $|q|$-way intersection over ordered sets of integers, where each set represents the documents containing one of the terms, and each integer in each set is an ordinal document identifier. As is the case with many computing applications, there is tension between the way in which the data is represented, and the ways in which it is to be manipulated. In particular, the sets representing index data for typical document collections are highly compressible, but are processed using random access techniques, meaning that methods for carrying out set intersections must be alert to issues to do with access patterns and data representation.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Transier:2010:EBA, author = "Frederik Transier and Peter Sanders", title = "Engineering basic algorithms of an in-memory text search engine", journal = j-TOIS, volume = "29", number = "1", pages = "2:1--2:??", month = dec, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1877766.1877768", ISSN = "1046-8188", bibdate = "Thu Dec 23 17:15:03 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Inverted index data structures are the key to fast text search engines. We first investigate one of the predominant operation on inverted indexes, which asks for intersecting two sorted lists of document IDs of different lengths. We explore compression and performance of different inverted list data structures. In particular, we present Lookup, a new data structure that allows intersection in expected time linear in the smaller list. Based on this result, we present the algorithmic core of a full text data base that allows fast Boolean queries, phrase queries, and document reporting using less space than the input text. The system uses a carefully choreographed combination of classical data compression techniques and inverted-index-based search data structures.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Krikon:2010:UIP, author = "Eyal Krikon and Oren Kurland and Michael Bendersky", title = "Utilizing inter-passage and inter-document similarities for reranking search results", journal = j-TOIS, volume = "29", number = "1", pages = "3:1--3:??", month = dec, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1877766.1877769", ISSN = "1046-8188", bibdate = "Thu Dec 23 17:15:03 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present a novel language-model-based approach to reranking search results; that is, reordering the documents in an initially retrieved list so as to improve precision at top ranks. Our model integrates whole-document information with that induced from passages. Specifically, inter-passage, inter-document, and query-based similarities, which constitute a rich source of information, are combined in our model. Empirical evaluation shows that the precision-at-top-ranks performance of our model is substantially better than that of the initial ranking upon which reranking is performed. Furthermore, the performance is substantially better than that of a commonly used passage-based document ranking method that does not exploit inter-item similarities.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Minkov:2010:IGW, author = "Einat Minkov and William W. Cohen", title = "Improving graph-walk-based similarity with reranking: {Case} studies for personal information management", journal = j-TOIS, volume = "29", number = "1", pages = "4:1--4:??", month = dec, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1877766.1877770", ISSN = "1046-8188", bibdate = "Thu Dec 23 17:15:03 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Relational or semistructured data is naturally represented by a graph, where nodes denote entities and directed typed edges represent the relations between them. Such graphs are heterogeneous, describing different types of objects and links. We represent personal information as a graph that includes messages, terms, persons, dates, and other object types, and relations like sent-to and has-term. Given the graph, we apply finite random graph walks to induce a measure of entity similarity, which can be viewed as a tool for performing search in the graph. Experiments conducted using personal email collections derived from the Enron corpus and other corpora show how the different tasks of alias finding, threading, and person name disambiguation can be all addressed as search queries in this framework, where the graph-walk-based similarity metric is preferable to alternative approaches, and further improvements are achieved with learning.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{DellAmico:2010:DFP, author = "Matteo Dell'Amico and Licia Capra", title = "Dependable filtering: {Philosophy} and realizations", journal = j-TOIS, volume = "29", number = "1", pages = "5:1--5:??", month = dec, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1877766.1877771", ISSN = "1046-8188", bibdate = "Thu Dec 23 17:15:03 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Digital content production and distribution has radically changed our business models. An unprecedented volume of supply is now on offer, whetted by the demand of millions of users from all over the world. Since users cannot be expected to browse through millions of different items to find what they might like, filtering has become a popular technique to connect supply and demand: trusted users are first identified, and their opinions are then used to create recommendations. In this domain, users' trustworthiness has been measured according to one of the following two criteria: taste similarity (i.e., ``I trust those who agree with me''), or social ties (i.e., ``I trust my friends, and the people that my friends trust'').", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Choudhury:2010:ECU, author = "Munmun De Choudhury and Hari Sundaram and Ajita John and Doree Duncan Seligmann", title = "Extraction, characterization and utility of prototypical communication groups in the blogosphere", journal = j-TOIS, volume = "29", number = "1", pages = "6:1--6:??", month = dec, year = "2010", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1877766.1877772", ISSN = "1046-8188", bibdate = "Thu Dec 23 17:15:03 MST 2010", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article analyzes communication within a set of individuals to extract the representative prototypical groups and provides a novel framework to establish the utility of such groups. Corporations may want to identify representative groups (which are indicative of the overall communication set) because it is easier to track the prototypical groups rather than the entire set. This can be useful for advertising, identifying ``hot'' spots of resource consumption as well as in mining representative moods or temperature of a community. Our framework has three parts: extraction, characterization, and utility of prototypical groups. First, we extract groups by developing features representing communication dynamics of the individuals.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fang:2011:DEI, author = "Hui Fang and Tao Tao and Chengxiang Zhai", title = "Diagnostic Evaluation of Information Retrieval Models", journal = j-TOIS, volume = "29", number = "2", pages = "7:1--7:??", month = apr, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1961209.1961210", ISSN = "1046-8188", bibdate = "Tue May 3 17:57:26 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Developing effective retrieval models is a long-standing central challenge in information retrieval research. In order to develop more effective models, it is necessary to understand the deficiencies of the current retrieval models and the relative strengths of each of them. In this article, we propose a general methodology to analytically and experimentally diagnose the weaknesses of a retrieval function, which provides guidance on how to further improve its performance. Our methodology is motivated by the empirical observation that good retrieval performance is closely related to the use of various retrieval heuristics. We connect the weaknesses and strengths of a retrieval function with its implementations of these retrieval heuristics, and propose two strategies to check how well a retrieval function implements the desired retrieval heuristics.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Egozi:2011:CBI, author = "Ofer Egozi and Shaul Markovitch and Evgeniy Gabrilovich", title = "Concept-Based Information Retrieval Using Explicit Semantic Analysis", journal = j-TOIS, volume = "29", number = "2", pages = "8:1--8:??", month = apr, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1961209.1961211", ISSN = "1046-8188", bibdate = "Tue May 3 17:57:26 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information retrieval systems traditionally rely on textual keywords to index and retrieve documents. Keyword-based retrieval may return inaccurate and incomplete results when different keywords are used to describe the same concept in the documents and in the queries. Furthermore, the relationship between these related keywords may be semantic rather than syntactic, and capturing it thus requires access to comprehensive human world knowledge. Concept-based retrieval methods have attempted to tackle these difficulties by using manually built thesauri, by relying on term cooccurrence data, or by extracting latent word relationships and concepts from a corpus. In this article we introduce a new concept-based retrieval approach based on Explicit Semantic Analysis (ESA), a recently proposed method that augments keyword-based text representation with concept-based features, automatically extracted from massive human knowledge repositories such as Wikipedia.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ma:2011:IRS, author = "Hao Ma and Tom Chao Zhou and Michael R. Lyu and Irwin King", title = "Improving Recommender Systems by Incorporating Social Contextual Information", journal = j-TOIS, volume = "29", number = "2", pages = "9:1--9:??", month = apr, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1961209.1961212", ISSN = "1046-8188", bibdate = "Tue May 3 17:57:26 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Due to their potential commercial value and the associated great research challenges, recommender systems have been extensively studied by both academia and industry recently. However, the data sparsity problem of the involved user-item matrix seriously affects the recommendation quality. Many existing approaches to recommender systems cannot easily deal with users who have made very few ratings. In view of the exponential growth of information generated by online users, social contextual information analysis is becoming important for many Web applications. In this article, we propose a factor analysis approach based on probabilistic matrix factorization to alleviate the data sparsity and poor prediction accuracy problems by incorporating social contextual information, such as social networks and social tags.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Mei:2011:CVR, author = "Tao Mei and Bo Yang and Xian-Sheng Hua and Shipeng Li", title = "Contextual Video Recommendation by Multimodal Relevance and User Feedback", journal = j-TOIS, volume = "29", number = "2", pages = "10:1--10:??", month = apr, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1961209.1961213", ISSN = "1046-8188", bibdate = "Tue May 3 17:57:26 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With Internet delivery of video content surging to an unprecedented level, video recommendation, which suggests relevant videos to targeted users according to their historical and current viewings or preferences, has become one of most pervasive online video services. This article presents a novel contextual video recommendation system, called VideoReach, based on multimodal content relevance and user feedback. We consider an online video usually consists of different modalities (i.e., visual and audio track, as well as associated texts such as query, keywords, and surrounding text). Therefore, the recommended videos should be relevant to current viewing in terms of multimodal relevance. We also consider that different parts of videos are with different degrees of interest to a user, as well as different features and modalities have different contributions to the overall relevance.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Vallet:2011:EUB, author = "David Vallet and Frank Hopfgartner and Joemon M. Jose and Pablo Castells", title = "Effects of Usage-Based Feedback on Video Retrieval: {A} Simulation-Based Study", journal = j-TOIS, volume = "29", number = "2", pages = "11:1--11:??", month = apr, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1961209.1961214", ISSN = "1046-8188", bibdate = "Tue May 3 17:57:26 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present a model for exploiting community-based usage information for video retrieval, where implicit usage information from past users is exploited in order to provide enhanced assistance in video retrieval tasks, and alleviate the effects of the semantic gap problem. We propose a graph-based model for all types of implicit and explicit feedback, in which the relevant usage information is represented. Our model is designed to capture the complex interactions of a user with an interactive video retrieval system, including the representation of sequences of user-system interaction during a search session. Building upon this model, four recommendation strategies are defined and evaluated.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Sun:2011:IIR, author = "Bingjun Sun and Prasenjit Mitra and C. Lee Giles and Karl T. Mueller", title = "Identifying, Indexing, and Ranking Chemical Formulae and Chemical Names in Digital Documents", journal = j-TOIS, volume = "29", number = "2", pages = "12:1--12:??", month = apr, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1961209.1961215", ISSN = "1046-8188", bibdate = "Tue May 3 17:57:26 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "End-users utilize chemical search engines to search for chemical formulae and chemical names. Chemical search engines identify and index chemical formulae and chemical names appearing in text documents to support efficient search and retrieval in the future. Identifying chemical formulae and chemical names in text automatically has been a hard problem that has met with varying degrees of success in the past. We propose algorithms for chemical formula and chemical name tagging using Conditional Random Fields (CRFs) and Support Vector Machines (SVMs) that achieve higher accuracy than existing (published) methods. After chemical entities have been identified in text documents, they must be indexed.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{SanPedro:2011:CRY, author = "Jose {San Pedro} and Stefan Siersdorfer and Mark Sanderson", title = "Content redundancy in {YouTube} and its application to video tagging", journal = j-TOIS, volume = "29", number = "3", pages = "13:1--13:??", month = jul, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1993036.1993037", ISSN = "1046-8188", bibdate = "Tue Jul 19 18:04:21 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The emergence of large-scale social Web communities has enabled users to share online vast amounts of multimedia content. An analysis of YouTube reveals a high amount of redundancy, in the form of videos with overlapping or duplicated content. We use robust content-based video analysis techniques to detect overlapping sequences between videos. Based on the output of these techniques, we present an in-depth study of duplication and content overlap in YouTube, and analyze various dependencies between content overlap and meta data such as video titles, views, video ratings, and tags. As an application, we show that content-based links provide useful information for generating new tag assignments.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Schedl:2011:EMS, author = "Markus Schedl and Tim Pohle and Peter Knees and Gerhard Widmer", title = "Exploring the music similarity space on the {Web}", journal = j-TOIS, volume = "29", number = "3", pages = "14:1--14:??", month = jul, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1993036.1993038", ISSN = "1046-8188", bibdate = "Tue Jul 19 18:04:21 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article comprehensively addresses the problem of similarity measurement between music artists via text-based features extracted from Web pages. To this end, we present a thorough evaluation of different term-weighting strategies, normalization methods, aggregation functions, and similarity measurement techniques. In large-scale genre classification experiments carried out on real-world artist collections, we analyze several thousand combinations of settings/parameters that influence the similarity calculation process, and investigate in which way they impact the quality of the similarity estimates. Accurate similarity measures for music are vital for many applications, such as automated playlist generation, music recommender systems, music information systems, or intelligent user interfaces to access music collections by means beyond text-based browsing.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yan:2011:TSG, author = "Xin Yan and Raymond Y. K. Lau and Dawei Song and Xue Li and Jian Ma", title = "Toward a semantic granularity model for domain-specific information retrieval", journal = j-TOIS, volume = "29", number = "3", pages = "15:1--15:??", month = jul, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1993036.1993039", ISSN = "1046-8188", bibdate = "Tue Jul 19 18:04:21 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Both similarity-based and popularity-based document ranking functions have been successfully applied to information retrieval (IR) in general. However, the dimension of semantic granularity also should be considered for effective retrieval. In this article, we propose a semantic granularity-based IR model that takes into account the three dimensions, namely similarity, popularity, and semantic granularity, to improve domain-specific search. In particular, a concept-based computational model is developed to estimate the semantic granularity of documents with reference to a domain ontology. Semantic granularity refers to the levels of semantic detail carried by an information item. The results of our benchmark experiments confirm that the proposed semantic granularity based IR model performs significantly better than the similarity-based baseline in both a bio-medical and an agricultural domain.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bast:2011:FCH, author = "Hannah Bast and Marjan Celikik", title = "Fast construction of the {HYB} index", journal = j-TOIS, volume = "29", number = "3", pages = "16:1--16:??", month = jul, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/1993036.1993040", ISSN = "1046-8188", bibdate = "Tue Jul 19 18:04:21 MDT 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "As shown in a series of recent works, the HYB index is an alternative to the inverted index (INV) that enables very fast prefix searches, which in turn is the basis for fast processing of many other types of advanced queries, including autocompletion, faceted search, error-tolerant search, database-style select and join, and semantic search. In this work we show that HYB can be constructed at least as fast as INV, and often up to twice as fast. This is because HYB, by its nature, requires only a half-inversion of the data and allows an efficient in-place instead of the traditional merge-based index construction.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Macdonald:2011:UBA, author = "Craig Macdonald and Iadh Ounis and Nicola Tonellotto", title = "Upper-bound approximations for dynamic pruning", journal = j-TOIS, volume = "29", number = "4", pages = "17:1--17:??", month = dec, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2037661.2037662", ISSN = "1046-8188", bibdate = "Thu Dec 15 09:18:39 MST 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Dynamic pruning strategies for information retrieval systems can increase querying efficiency without decreasing effectiveness by using upper bounds to safely omit scoring documents that are unlikely to make the final retrieved set. Often, such upper bounds are pre-calculated at indexing time for a given weighting model. However, this precludes changing, adapting or training the weighting model without recalculating the upper bounds. Instead, upper bounds should be approximated at querying time from various statistics of each term to allow on-the-fly adaptation of the applied retrieval strategy. This article, by using uniform notation, formulates the problem of determining a term upper-bound given a weighting model and discusses the limitations of existing approximations.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chen:2011:RFA, author = "Keke Chen and Jing Bai and Zhaohui Zheng", title = "Ranking function adaptation with boosting trees", journal = j-TOIS, volume = "29", number = "4", pages = "18:1--18:??", month = dec, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2037661.2037663", ISSN = "1046-8188", bibdate = "Thu Dec 15 09:18:39 MST 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Machine-learned ranking functions have shown successes in Web search engines. With the increasing demands on developing effective ranking functions for different search domains, we have seen a big bottleneck, that is, the problem of insufficient labeled training data, which has significantly slowed the development and deployment of machine-learned ranking functions for different domains. There are two possible approaches to address this problem: (1) combining labeled training data from similar domains with the small target-domain labeled data for training or (2) using pairwise preference data extracted from user clickthrough log for the target domain for training. In this article, we propose a new approach called tree-based ranking function adaptation (Trada) to effectively utilize these data sources for training cross-domain ranking functions.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Paik:2011:GEE, author = "Jiaul H. Paik and Mandar Mitra and Swapan K. Parui and Kalervo J{\"a}rvelin", title = "{GRAS}: an effective and efficient stemming algorithm for information retrieval", journal = j-TOIS, volume = "29", number = "4", pages = "19:1--19:??", month = dec, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2037661.2037664", ISSN = "1046-8188", bibdate = "Thu Dec 15 09:18:39 MST 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A novel graph-based language-independent stemming algorithm suitable for information retrieval is proposed in this article. The main features of the algorithm are retrieval effectiveness, generality, and computational efficiency. We test our approach on seven languages (using collections from the TREC, CLEF, and FIRE evaluation platforms) of varying morphological complexity. Significant performance improvement over plain word-based retrieval, three other language-independent morphological normalizers, as well as rule-based stemmers is demonstrated.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Parameswaran:2011:RSC, author = "Aditya Parameswaran and Petros Venetis and Hector Garcia-Molina", title = "Recommendation systems with complex constraints: a course recommendation perspective", journal = j-TOIS, volume = "29", number = "4", pages = "20:1--20:??", month = dec, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2037661.2037665", ISSN = "1046-8188", bibdate = "Thu Dec 15 09:18:39 MST 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We study the problem of making recommendations when the objects to be recommended must also satisfy constraints or requirements. In particular, we focus on course recommendations: the courses taken by a student must satisfy requirements (e.g., take two out of a set of five math courses) in order for the student to graduate. Our work is done in the context of the CourseRank system, used by students to plan their academic program at Stanford University. Our goal is to recommend to these students courses that not only help satisfy constraints, but that are also desirable (e.g., popular or taken by similar students).", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2011:CBR, author = "Jiajun Liu and Zi Huang and Heng Tao Shen and Bin Cui", title = "Correlation-based retrieval for heavily changed near-duplicate videos", journal = j-TOIS, volume = "29", number = "4", pages = "21:1--21:??", month = dec, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2037661.2037666", ISSN = "1046-8188", bibdate = "Thu Dec 15 09:18:39 MST 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The unprecedented and ever-growing number of Web videos nowadays leads to the massive existence of near-duplicate videos. Very often, some near-duplicate videos exhibit great content changes, while the user perceives little information change, for example, color features change significantly when transforming a color video with a blue filter. These feature changes contribute to low-level video similarity computations, making conventional similarity-based near-duplicate video retrieval techniques incapable of accurately capturing the implicit relationship between two near-duplicate videos with fairly large content modifications. In this paper, we introduce a new dimension for near-duplicate video retrieval. Different from existing near-duplicate video retrieval approaches which are based on video-content similarity, we explore the correlation between two videos.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Balog:2011:QME, author = "Krisztian Balog and Marc Bron and Maarten {De Rijke}", title = "Query modeling for entity search based on terms, categories, and examples", journal = j-TOIS, volume = "29", number = "4", pages = "22:1--22:??", month = dec, year = "2011", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2037661.2037667", ISSN = "1046-8188", bibdate = "Thu Dec 15 09:18:39 MST 2011", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Users often search for entities instead of documents, and in this setting, are willing to provide extra input, in addition to a series of query terms, such as category information and example entities. We propose a general probabilistic framework for entity search to evaluate and provide insights in the many ways of using these types of input for query modeling. We focus on the use of category information and show the advantage of a category-based representation over a term-based representation, and also demonstrate the effectiveness of category-based expansion using example entities.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Farina:2012:WBS, author = "Antonio Fari{\~n}a and Nieves R. Brisaboa and Gonzalo Navarro and Francisco Claude and {\'A}ngeles S. Places and Eduardo Rodr{\'\i}guez", title = "Word-based self-indexes for natural language text", journal = j-TOIS, volume = "30", number = "1", pages = "1:1--1:??", month = feb, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2094072.2094073", ISSN = "1046-8188", bibdate = "Wed Feb 29 16:22:15 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The inverted index supports efficient full-text searches on natural language text collections. It requires some extra space over the compressed text that can be traded for search speed. It is usually fast for single-word searches, yet phrase searches require more expensive intersections. In this article we introduce a different kind of index. It replaces the text using essentially the same space required by the compressed text alone (compression ratio around 35\%). Within this space it supports not only decompression of arbitrary passages, but efficient word and phrase searches. Searches are orders of magnitude faster than those over inverted indexes when looking for phrases, and still faster on single-word searches when little space is available.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Altingovde:2012:SIP, author = "Ismail S. Altingovde and Rifat Ozcan and {\"O}zg{\"u}r Ulusoy", title = "Static index pruning in {Web} search engines: Combining term and document popularities with query views", journal = j-TOIS, volume = "30", number = "1", pages = "2:1--2:??", month = feb, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2094072.2094074", ISSN = "1046-8188", bibdate = "Wed Feb 29 16:22:15 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Static index pruning techniques permanently remove a presumably redundant part of an inverted file, to reduce the file size and query processing time. These techniques differ in deciding which parts of an index can be removed safely; that is, without changing the top-ranked query results. As defined in the literature, the query view of a document is the set of query terms that access to this particular document, that is, retrieves this document among its top results. In this paper, we first propose using query views to improve the quality of the top results compared against the original results. We incorporate query views in a number of static pruning strategies, namely term-centric, document-centric, term popularity based and document access popularity based approaches, and show that the new strategies considerably outperform their counterparts especially for the higher levels of pruning and for both disjunctive and conjunctive query processing.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bhatia:2012:SFT, author = "Sumit Bhatia and Prasenjit Mitra", title = "Summarizing figures, tables, and algorithms in scientific publications to augment search results", journal = j-TOIS, volume = "30", number = "1", pages = "3:1--3:??", month = feb, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2094072.2094075", ISSN = "1046-8188", bibdate = "Wed Feb 29 16:22:15 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Increasingly, special-purpose search engines are being built to enable the retrieval of document-elements like tables, figures, and algorithms [Bhatia et al. 2010; Liu et al. 2007; Hearst et al. 2007]. These search engines present a thumbnail view of document-elements, some document metadata such as the title of the papers and their authors, and the caption of the document-element. While some authors in some disciplines write carefully tailored captions, generally, the author of a document assumes that the caption will be read in the context of the text in the document. When the caption is presented out of context as in a document-element-search-engine result, it may not contain enough information to help the end-user understand what the content of the document-element is.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Carterette:2012:MTS, author = "Benjamin A. Carterette", title = "Multiple testing in statistical analysis of systems-based information retrieval experiments", journal = j-TOIS, volume = "30", number = "1", pages = "4:1--4:??", month = feb, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2094072.2094076", ISSN = "1046-8188", bibdate = "Wed Feb 29 16:22:15 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "High-quality reusable test collections and formal statistical hypothesis testing together support a rigorous experimental environment for information retrieval research. But as Armstrong et al. [2009b] recently argued, global analysis of experiments suggests that there has actually been little real improvement in ad hoc retrieval effectiveness over time. We investigate this phenomenon in the context of simultaneous testing of many hypotheses using a fixed set of data. We argue that the most common approaches to significance testing ignore a great deal of information about the world. Taking into account even a fairly small amount of this information can lead to very different conclusions about systems than those that have appeared in published literature.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Broschart:2012:HPP, author = "Andreas Broschart and Ralf Schenkel", title = "High-performance processing of text queries with tunable pruned term and term pair indexes", journal = j-TOIS, volume = "30", number = "1", pages = "5:1--5:??", month = feb, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2094072.2094077", ISSN = "1046-8188", bibdate = "Wed Feb 29 16:22:15 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Term proximity scoring is an established means in information retrieval for improving result quality of full-text queries. Integrating such proximity scores into efficient query processing, however, has not been equally well studied. Existing methods make use of precomputed lists of documents where tuples of terms, usually pairs, occur together, usually incurring a huge index size compared to term-only indexes. This article introduces a joint framework for trading off index size and result quality, and provides optimization techniques for tuning precomputed indexes towards either maximal result quality or maximal query processing performance under controlled result quality, given an upper bound for the index size.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chapelle:2012:LSV, author = "Olivier Chapelle and Thorsten Joachims and Filip Radlinski and Yisong Yue", title = "Large-scale validation and analysis of interleaved search evaluation", journal = j-TOIS, volume = "30", number = "1", pages = "6:1--6:??", month = feb, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2094072.2094078", ISSN = "1046-8188", bibdate = "Wed Feb 29 16:22:15 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Interleaving is an increasingly popular technique for evaluating information retrieval systems based on implicit user feedback. While a number of isolated studies have analyzed how this technique agrees with conventional offline evaluation approaches and other online techniques, a complete picture of its efficiency and effectiveness is still lacking. In this paper we extend and combine the body of empirical evidence regarding interleaving, and provide a comprehensive analysis of interleaving using data from two major commercial search engines and a retrieval system for scientific literature. In particular, we analyze the agreement of interleaving with manual relevance judgments and observational implicit feedback measures, estimate the statistical efficiency of interleaving, and explore the relative performance of different interleaving variants.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cao:2012:AEC, author = "Xin Cao and Gao Cong and Bin Cui and Christian S. Jensen and Quan Yuan", title = "Approaches to Exploring Category Information for Question Retrieval in Community Question-Answer Archives", journal = j-TOIS, volume = "30", number = "2", pages = "7:1--7:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180869", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Community Question Answering (CQA) is a popular type of service where users ask questions and where answers are obtained from other users or from historical question-answer pairs. CQA archives contain large volumes of questions organized into a hierarchy of categories. As an essential function of CQA services, question retrieval in a CQA archive aims to retrieve historical question-answer pairs that are relevant to a query question. This article presents several new approaches to exploiting the category information of questions for improving the performance of question retrieval, and it applies these approaches to existing question retrieval models, including a state-of-the-art question retrieval model. Experiments conducted on real CQA data demonstrate that the proposed techniques are effective and efficient and are capable of outperforming a variety of baseline methods significantly.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Miotto:2012:PMC, author = "Riccardo Miotto and Nicola Orio", title = "A Probabilistic Model to Combine Tags and Acoustic Similarity for Music Retrieval", journal = j-TOIS, volume = "30", number = "2", pages = "8:1--8:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180870", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The rise of the Internet has led the music industry to a transition from physical media to online products and services. As a consequence, current online music collections store millions of songs and are constantly being enriched with new content. This has created a need for music technologies that allow users to interact with these extensive collections efficiently and effectively. Music search and discovery may be carried out using tags, matching user interests and exploiting content-based acoustic similarity. One major issue in music information retrieval is how to combine such noisy and heterogeneous information sources in order to improve retrieval effectiveness. With this aim in mind, the article explores a novel music retrieval framework based on combining tags and acoustic similarity through a probabilistic graph-based representation of a collection of songs. The retrieval function highlights the path across the graph that most likely observes a user query and is used to improve state-of-the-art music search and discovery engines by delivering more relevant ranking lists. Indeed, by means of an empirical evaluation, we show how the proposed approach leads to better performances than retrieval strategies which rank songs according to individual information sources alone or which use a combination of them.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tigelaar:2012:PPI, author = "Almer S. Tigelaar and Djoerd Hiemstra and Dolf Trieschnigg", title = "Peer-to-Peer Information Retrieval: An Overview", journal = j-TOIS, volume = "30", number = "2", pages = "9:1--9:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180871", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Peer-to-peer technology is widely used for file sharing. In the past decade a number of prototype peer-to-peer information retrieval systems have been developed. Unfortunately, none of these has seen widespread real-world adoption and thus, in contrast with file sharing, information retrieval is still dominated by centralized solutions. In this article we provide an overview of the key challenges for peer-to-peer information retrieval and the work done so far. We want to stimulate and inspire further research to overcome these challenges. This will open the door to the development and large-scale deployment of real-world peer-to-peer information retrieval systems that rival existing centralized client-server solutions in terms of scalability, performance, user satisfaction, and freedom.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pal:2012:EQS, author = "Aditya Pal and F. Maxwell Harper and Joseph A. Konstan", title = "Exploring Question Selection Bias to Identify Experts and Potential Experts in Community Question Answering", journal = j-TOIS, volume = "30", number = "2", pages = "10:1--10:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180872", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Community Question Answering (CQA) services enable their users to exchange knowledge in the form of questions and answers. These communities thrive as a result of a small number of highly active users, typically called experts, who provide a large number of high-quality useful answers. Expert identification techniques enable community managers to take measures to retain the experts in the community. There is further value in identifying the experts during the first few weeks of their participation as it would allow measures to nurture and retain them. In this article we address two problems: (a) How to identify current experts in CQA? and (b) How to identify users who have potential of becoming experts in future (potential experts)? In particular, we propose a probabilistic model that captures the selection preferences of users based on the questions they choose for answering. The probabilistic model allows us to run machine learning methods for identifying experts and potential experts. Our results over several popular CQA datasets indicate that experts differ considerably from ordinary users in their selection preferences; enabling us to predict experts with higher accuracy over several baseline models. We show that selection preferences can be combined with baseline measures to improve the predictive performance even further.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Shtok:2012:PQP, author = "Anna Shtok and Oren Kurland and David Carmel and Fiana Raiber and Gad Markovits", title = "Predicting Query Performance by Query-Drift Estimation", journal = j-TOIS, volume = "30", number = "2", pages = "11:1--11:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180873", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Predicting query performance, that is, the effectiveness of a search performed in response to a query, is a highly important and challenging problem. We present a novel approach to this task that is based on measuring the standard deviation of retrieval scores in the result list of the documents most highly ranked. We argue that for retrieval methods that are based on document-query surface-level similarities, the standard deviation can serve as a surrogate for estimating the presumed amount of query drift in the result list, that is, the presence (and dominance) of aspects or topics not related to the query in documents in the list. Empirical evaluation demonstrates the prediction effectiveness of our approach for several retrieval models. Specifically, the prediction quality often transcends that of current state-of-the-art prediction methods.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Savoy:2012:AAB, author = "Jacques Savoy", title = "Authorship Attribution Based on Specific Vocabulary", journal = j-TOIS, volume = "30", number = "2", pages = "12:1--12:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180874", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In this article we propose a technique for computing a standardized Z score capable of defining the specific vocabulary found in a text (or part thereof) compared to that of an entire corpus. Assuming that the term occurrence follows a binomial distribution, this method is then applied to weight terms (words and punctuation symbols in the current study), representing the lexical specificity of the underlying text. In a final stage, to define an author profile we suggest averaging these text representations and then applying them along with a distance measure to derive a simple and efficient authorship attribution scheme. To evaluate this algorithm and demonstrate its effectiveness, we develop two experiments, the first based on 5,408 newspaper articles ( Glasgow Herald ) written in English by 20 distinct authors and the second on 4,326 newspaper articles ( La Stampa ) written in Italian by 20 distinct authors. These experiments demonstrate that the suggested classification scheme tends to perform better than the Delta rule method based on the most frequent words, better than the chi-square distance based on word profiles and punctuation marks, better than the KLD scheme based on a predefined set of words, and better than the na{\"\i}ve Bayes approach.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nie:2012:OIS, author = "Liqiang Nie and Meng Wang and Zheng-Jun Zha and Tat-Seng Chua", title = "Oracle in Image Search: a Content-Based Approach to Performance Prediction", journal = j-TOIS, volume = "30", number = "2", pages = "13:1--13:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180875", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article studies a novel problem in image search. Given a text query and the image ranking list returned by an image search system, we propose an approach to automatically predict the search performance. We demonstrate that, in order to estimate the mathematical expectations of Average Precision (AP) and Normalized Discounted Cumulative Gain (NDCG), we only need to predict the relevance probability of each image. We accomplish the task with a query-adaptive graph-based learning based on the images' ranking order and visual content. We validate our approach with a large-scale dataset that contains the image search results of 1,165 queries from 4 popular image search engines. Empirical studies demonstrate that our approach is able to generate predictions that are highly correlated with the real search performance. Based on the proposed image search performance prediction scheme, we introduce three applications: image metasearch, multilingual image search, and Boolean image search. Comprehensive experiments are conducted to validate our approach.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Guttenbrunner:2012:MFE, author = "Mark Guttenbrunner and Andreas Rauber", title = "A Measurement Framework for Evaluating Emulators for Digital Preservation", journal = j-TOIS, volume = "30", number = "2", pages = "14:1--14:??", month = may, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2180868.2180876", ISSN = "1046-8188", bibdate = "Wed May 23 17:07:22 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Accessible emulation is often the method of choice for maintaining digital objects, specifically complex ones such as applications, business processes, or electronic art. However, validating the emulator's ability to faithfully reproduce the original behavior of digital objects is complicated. This article presents an evaluation framework and a set of tests that allow assessment of the degree to which system emulation preserves original characteristics and thus significant properties of digital artifacts. The original system, hardware, and software properties are described. Identical environment is then recreated via emulation. Automated user input is used to eliminate potential confounders. The properties of a rendered form of the object are then extracted automatically or manually either in a target state, a series of states, or as a continuous stream. The concepts described in this article enable preservation planners to evaluate how emulation affects the behavior of digital objects compared to their behavior in the original environment. We also review how these principles can and should be applied to the evaluation of migration and other preservation strategies as a general principle of evaluating the invocation and faithful rendering of digital objects and systems. The article concludes with design requirements for emulators developed for digital preservation tasks.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Larson:2012:SIS, author = "Martha Larson and Franciska de Jong and Wessel Kraaij and Steve Renals", title = "Special issue on searching speech", journal = j-TOIS, volume = "30", number = "3", pages = "15:1--15:??", month = aug, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2328967.2328968", ISSN = "1046-8188", bibdate = "Thu Sep 6 09:43:05 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2012:DPC, author = "Dong Wang and Simon King and Joe Frankel and Ravichander Vipperla and Nicholas Evans and Rapha{\"e}l Troncy", title = "Direct posterior confidence for out-of-vocabulary spoken term detection", journal = j-TOIS, volume = "30", number = "3", pages = "16:1--16:??", month = aug, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2328967.2328969", ISSN = "1046-8188", bibdate = "Thu Sep 6 09:43:05 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Spoken term detection (STD) is a key technology for spoken information retrieval. As compared to the conventional speech transcription and keyword spotting, STD is an open-vocabulary task and has to address out-of-vocabulary (OOV) terms. Approaches based on subword units, for example phones, are widely used to solve the OOV issue; however, performance on OOV terms is still substantially inferior to that of in-vocabulary (INV) terms. The performance degradation on OOV terms can be attributed to a multitude of factors. One particular factor we address in this article is the unreliable confidence estimation caused by weak acoustic and language modeling due to the absence of OOV terms in the training corpora. We propose a direct posterior confidence derived from a discriminative model, such as multilayer perceptron (MLP). The new confidence considers a wide-range acoustic context which is usually important for speech recognition and retrieval; moreover, it localizes on detected speech segments and therefore avoids the impact of long-span word context which is usually unreliable for OOV term detection. In this article, we first develop an extensive discussion about the modeling weakness problem associated with OOV terms, and then propose our approach to address this problem based on direct poster confidence. Our experiments carried out on spontaneous and conversational multiparty meeting speech, demonstrate that the proposed technique provides a significant improvement in STD performance as compared to conventional lattice-based confidence, in particular for OOV terms. Furthermore, the new confidence estimation approach is fused with other advanced techniques for OOV treatment, such as stochastic pronunciation modeling and discriminative confidence normalization. This leads to an integrated solution for OOV term detection that results in a large performance improvement.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Luz:2012:NSP, author = "Saturnino Luz", title = "The nonverbal structure of patient case discussions in multidisciplinary medical team meetings", journal = j-TOIS, volume = "30", number = "3", pages = "17:1--17:??", month = aug, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2328967.2328970", ISSN = "1046-8188", bibdate = "Thu Sep 6 09:43:05 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Meeting analysis has a long theoretical tradition in social psychology, with established practical ramifications in computer science, especially in computer supported cooperative work. More recently, a good deal of research has focused on the issues of indexing and browsing multimedia records of meetings. Most research in this area, however, is still based on data collected in laboratories, under somewhat artificial conditions. This article presents an analysis of the discourse structure and spontaneous interactions at real-life multidisciplinary medical team meetings held as part of the work routine in a major hospital. It is hypothesized that the conversational structure of these meetings, as indicated by sequencing and duration of vocalizations, enables segmentation into individual patient case discussions. The task of segmenting audio-visual records of multidisciplinary medical team meetings is described as a topic segmentation task, and a method for automatic segmentation is proposed. An empirical evaluation based on hand labelled data is presented, which determines the optimal length of vocalization sequences for segmentation, and establishes the competitiveness of the method with approaches based on more complex knowledge sources. The effectiveness of Bayesian classification as a segmentation method, and its applicability to meeting segmentation in other domains are discussed.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tejedor:2012:CML, author = "Javier Tejedor and Michal Fapso and Igor Sz{\"o}ke and Jan `Honza' Cernock{\'y} and Frantisek Gr{\'e}zl", title = "Comparison of methods for language-dependent and language-independent query-by-example spoken term detection", journal = j-TOIS, volume = "30", number = "3", pages = "18:1--18:??", month = aug, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2328967.2328971", ISSN = "1046-8188", bibdate = "Thu Sep 6 09:43:05 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article investigates query-by-example (QbE) spoken term detection (STD), in which the query is not entered as text, but selected in speech data or spoken. Two feature extractors based on neural networks (NN) are introduced: the first producing phone-state posteriors and the second making use of a compressive NN layer. They are combined with three different QbE detectors: while the Gaussian mixture model/hidden Markov model (GMM/HMM) and dynamic time warping (DTW) both work on continuous feature vectors, the third one, based on weighted finite-state transducers (WFST), processes phone lattices. QbE STD is compared to two standard STD systems with text queries: acoustic keyword spotting and WFST-based search of phone strings in phone lattices. The results are reported on four languages (Czech, English, Hungarian, and Levantine Arabic) using standard metrics: equal error rate (EER) and two versions of popular figure-of-merit (FOM). Language-dependent and language-independent cases are investigated; the latter being particularly interesting for scenarios lacking standard resources to train speech recognition systems. While the DTW and GMM/HMM approaches produce the best results for a language-dependent setup depending on the target language, the GMM/HMM approach performs the best dealing with a language-independent setup. As far as WFSTs are concerned, they are promising as they allow for indexing and fast search.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Comas:2012:SFQ, author = "Pere R. Comas and Jordi Turmo and Llu{\'\i}s M{\`a}rquez", title = "{Sibyl}, a factoid question-answering system for spoken documents", journal = j-TOIS, volume = "30", number = "3", pages = "19:1--19:??", month = aug, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2328967.2328972", ISSN = "1046-8188", bibdate = "Thu Sep 6 09:43:05 MDT 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In this article, we present a factoid question-answering system, Sibyl, specifically tailored for question answering (QA) on spoken-word documents. This work explores, for the first time, which techniques can be robustly adapted from the usual QA on written documents to the more difficult spoken document scenario. More specifically, we study new information retrieval (IR) techniques designed or speech, and utilize several levels of linguistic information for the speech-based QA task. These include named-entity detection with phonetic information, syntactic parsing applied to speech transcripts, and the use of coreference resolution. Sibyl is largely based on supervised machine-learning techniques, with special focus on the answer extraction step, and makes little use of handcrafted knowledge. Consequently, it should be easily adaptable to other domains and languages. Sibyl and all its modules are extensively evaluated on the European Parliament Plenary Sessions English corpus, comparing manual with automatic transcripts obtained by three different automatic speech recognition (ASR) systems that exhibit significantly different word error rates. This data belongs to the CLEF 2009 track for QA on speech transcripts. The main results confirm that syntactic information is very useful for learning to rank question candidates, improving results on both manual and automatic transcripts, unless the ASR quality is very low. At the same time, our experiments on coreference resolution reveal that the state-of-the-art technology is not mature enough to be effectively exploited for QA with spoken documents. Overall, the performance of Sibyl is comparable or better than the state-of-the-art on this corpus, confirming the validity of our approach.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Moon:2012:OLF, author = "Taesup Moon and Wei Chu and Lihong Li and Zhaohui Zheng and Yi Chang", title = "An Online Learning Framework for Refining Recency Search Results with User Click Feedback", journal = j-TOIS, volume = "30", number = "4", pages = "20:1--20:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382439", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Traditional machine-learned ranking systems for Web search are often trained to capture stationary relevance of documents to queries, which have limited ability to track nonstationary user intention in a timely manner. In recency search, for instance, the relevance of documents to a query on breaking news often changes significantly over time, requiring effective adaptation to user intention. In this article, we focus on recency search and study a number of algorithms to improve ranking results by leveraging user click feedback. Our contributions are threefold. First, we use commercial search engine sessions collected in a random exploration bucket for reliable offline evaluation of these algorithms, which provides an unbiased comparison across algorithms without online bucket tests. Second, we propose an online learning approach that reranks and improves the search results for recency queries near real-time based on user clicks. This approach is very general and can be combined with sophisticated click models. Third, our empirical comparison of a dozen algorithms on real-world search data suggests importance of a few algorithmic choices in these applications, including generalization across different query-document pairs, specialization to popular queries, and near real-time adaptation of user clicks for reranking.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2012:DTT, author = "Hongyan Liu and Jun He and Yingqin Gu and Hui Xiong and Xiaoyong Du", title = "Detecting and Tracking Topics and Events from {Web} Search Logs", journal = j-TOIS, volume = "30", number = "4", pages = "21:1--21:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382440", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recent years have witnessed increased efforts on detecting topics and events from Web search logs, since this kind of data not only capture web content but also reflect the users' activities. However, the majority of existing work is focused on exploiting clustering techniques for topic and event detection. Due to the huge size and the evolving nature of Web data, existing clustering approaches are limited to meet the real-time demand. To that end, in this article, we propose a method called LETD to detect evolving topics in a timely manner. Also, we design the techniques to extract events from topics and to infer the evolving relationship among the events. For topic detection, we first provide a measurement to select the important URLs, which are most likely to describe a real-life topic. Then, starting from these selected URLs, we exploit the local expansion method to find other topic-related URLs. Moreover, in the LETD framework, we design algorithms based on Random Walk and Markov Random Fields (MRF), respectively. Because the LETD method exploits a divide-and-conquer strategy to process the data, it is more efficient than existing methods based on clustering techniques. To better illustrate the LETD framework, we develop a demo system StoryTeller which can discover hot topics and events, infer the evolving relationships among events, and visualize information in a storytelling way. This demo system can provide a global view of the topic development and help users target the interesting events more conveniently. Finally, experimental results on real-world Microsoft click-through data have shown that StoryTeller can find real-life hot topics and meaningful evolving relationships among events, and has also demonstrated the efficiency and effectiveness of the LETD method.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Abbasi:2012:DFM, author = "Ahmed Abbasi and Fatemeh `Mariam' Zahedi and Siddharth Kaza", title = "Detecting Fake Medical {Web} Sites Using Recursive Trust Labeling", journal = j-TOIS, volume = "30", number = "4", pages = "22:1--22:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382441", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Fake medical Web sites have become increasingly prevalent. Consequently, much of the health-related information and advice available online is inaccurate and/or misleading. Scores of medical institution Web sites are for organizations that do not exist and more than 90\% of online pharmacy Web sites are fraudulent. In addition to monetary losses exacted on unsuspecting users, these fake medical Web sites have severe public safety ramifications. According to a World Health Organization report, approximately half the drugs sold on the Web are counterfeit, resulting in thousands of deaths. In this study, we propose an adaptive learning algorithm called recursive trust labeling (RTL). RTL uses underlying content and graph-based classifiers, coupled with a recursive labeling mechanism, for enhanced detection of fake medical Web sites. The proposed method was evaluated on a test bed encompassing nearly 100 million links between 930,000 Web sites, including 1,000 known legitimate and fake medical sites. The experimental results revealed that RTL was able to significantly improve fake medical Web site detection performance over 19 comparison content and graph-based methods, various meta-learning techniques, and existing adaptive learning approaches, with an overall accuracy of over 94\%. Moreover, RTL was able to attain high performance levels even when the training dataset composed of as little as 30 Web sites. With the increased popularity of eHealth and Health 2.0, the results have important implications for online trust, security, and public safety.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Adomavicius:2012:SRA, author = "Gediminas Adomavicius and Jingjing Zhang", title = "Stability of Recommendation Algorithms", journal = j-TOIS, volume = "30", number = "4", pages = "23:1--23:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382442", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The article explores stability as a new measure of recommender systems performance. Stability is defined to measure the extent to which a recommendation algorithm provides predictions that are consistent with each other. Specifically, for a stable algorithm, adding some of the algorithm's own predictions to the algorithm's training data (for example, if these predictions were confirmed as accurate by users) would not invalidate or change the other predictions. While stability is an interesting theoretical property that can provide additional understanding about recommendation algorithms, we believe stability to be a desired practical property for recommender systems designers as well, because unstable recommendations can potentially decrease users' trust in recommender systems and, as a result, reduce users' acceptance of recommendations. In this article, we also provide an extensive empirical evaluation of stability for six popular recommendation algorithms on four real-world datasets. Our results suggest that stability performance of individual recommendation algorithms is consistent across a variety of datasets and settings. In particular, we find that model-based recommendation algorithms consistently demonstrate higher stability than neighborhood-based collaborative filtering techniques. In addition, we perform a comprehensive empirical analysis of many important factors (e.g., the sparsity of original rating data, normalization of input data, the number of new incoming ratings, the distribution of incoming ratings, the distribution of evaluation data, etc.) and report the impact they have on recommendation stability.", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Fu:2012:SSL, author = "Tianjun Fu and Ahmed Abbasi and Daniel Zeng and Hsinchun Chen", title = "Sentimental Spidering: Leveraging Opinion Information in Focused Crawlers", journal = j-TOIS, volume = "30", number = "4", pages = "24:1--24:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382443", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Despite the increased prevalence of sentiment-related information on the Web, there has been limited work on focused crawlers capable of effectively collecting not only topic-relevant but also sentiment-relevant content. In this article, we propose a novel focused crawler that incorporates topic and sentiment information as well as a graph-based tunneling mechanism for enhanced collection of opinion-rich Web content regarding a particular topic. The graph-based sentiment (GBS) crawler uses a text classifier that employs both topic and sentiment categorization modules to assess the relevance of candidate pages. This information is also used to label nodes in web graphs that are employed by the tunneling mechanism to improve collection recall. Experimental results on two test beds revealed that GBS was able to provide better precision and recall than seven comparison crawlers. Moreover, GBS was able to collect a large proportion of the relevant content after traversing far fewer pages than comparison methods. GBS outperformed comparison methods on various categories of Web pages in the test beds, including collection of blogs, Web forums, and social networking Web site content. Further analysis revealed that both the sentiment classification module and graph-based tunneling mechanism played an integral role in the overall effectiveness of the GBS crawler.", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{You:2012:EET, author = "Gae-Won You and Seung-Won Hwang and Young-In Song and Long Jiang and Zaiqing Nie", title = "Efficient Entity Translation Mining: a Parallelized Graph Alignment Approach", journal = j-TOIS, volume = "30", number = "4", pages = "25:1--25:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382444", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article studies the problem of mining entity translation, specifically, mining English and Chinese name pairs. Existing efforts can be categorized into (a) transliteration-based approaches that leverage phonetic similarity and (b) corpus-based approaches that exploit bilingual cooccurrences. These approaches suffer from inaccuracy and scarcity, respectively. In clear contrast, we use under-leveraged resources of monolingual entity cooccurrences crawled from entity search engines, which are represented as two entity-relationship graphs extracted from two language corpora, respectively. Our problem is then abstracted as finding correct mappings across two graphs. To achieve this goal, we propose a holistic approach to exploiting both transliteration similarity and monolingual cooccurrences. This approach, which builds upon monolingual corpora, complements existing corpus-based work requiring scarce resources of parallel or comparable corpus while significantly boosting the accuracy of transliteration-based work. In addition, by parallelizing the mapping process on multicore architectures, we speed up the computation by more than 10 times per unit accuracy. We validated the effectiveness and efficiency of our proposed approach using real-life datasets.", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gerani:2012:AMP, author = "Shima Gerani and Mark Carman and Fabio Crestani", title = "Aggregation Methods for Proximity-Based Opinion Retrieval", journal = j-TOIS, volume = "30", number = "4", pages = "26:1--26:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382445", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The enormous amount of user-generated data available on the Web provides a great opportunity to understand, analyze, and exploit people's opinions on different topics. Traditional Information Retrieval methods consider the relevance of documents to a topic but are unable to differentiate between subjective and objective documents. Opinion retrieval is a retrieval task in which not only the relevance of a document to the topic is important but also the amount of opinion expressed in the document about the topic. In this article, we address the blog post opinion retrieval task and propose methods that rank blog posts according to their relevance and opinionatedness toward a topic. We propose estimating the opinion density at each position in a document using a general opinion lexicon and kernel density functions. We propose and investigate different models for aggregating the opinion density at query terms positions to estimate the opinion score of every document. We then combine the opinion score with the relevance score based on a probabilistic justification. Experimental results on the BLOG06 dataset show that the proposed method provides significant improvement over the standard TREC baselines. The proposed models also achieve much higher performance compared to all state of the art methods.", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Callan:2012:TRO, author = "Jamie Callan", title = "{TOIS} Reviewers: {October 2009} to {September 2012}", journal = j-TOIS, volume = "30", number = "4", pages = "27:1--27:??", month = nov, year = "2012", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2382438.2382446", ISSN = "1046-8188", bibdate = "Tue Nov 27 17:48:53 MST 2012", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Kim:2013:EDE, author = "Jinhan Kim and Sanghoon Lee and Seung-Won Hwang and Sunghun Kim", title = "Enriching Documents with Examples: a Corpus Mining Approach", journal = j-TOIS, volume = "31", number = "1", pages = "1:1--1:??", month = jan, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2414782.2414783", ISSN = "1046-8188", bibdate = "Wed Jan 30 11:36:49 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Software developers increasingly rely on information from the Web, such as documents or code examples on application programming interfaces (APIs), to facilitate their development processes. However, API documents often do not include enough information for developers to fully understand how to use the APIs, and searching for good code examples requires considerable effort. To address this problem, we propose a novel code example recommendation system that combines the strength of browsing documents and searching for code examples and returns API documents embedded with high-quality code example summaries mined from the Web. Our evaluation results show that our approach provides code examples with high precision and boosts programmer productivity.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Webber:2013:ARC, author = "William Webber", title = "Approximate Recall Confidence Intervals", journal = j-TOIS, volume = "31", number = "1", pages = "2:1--2:??", month = jan, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2414782.2414784", ISSN = "1046-8188", bibdate = "Wed Jan 30 11:36:49 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recall, the proportion of relevant documents retrieved, is an important measure of effectiveness in information retrieval, particularly in the legal, patent, and medical domains. Where document sets are too large for exhaustive relevance assessment, recall can be estimated by assessing a random sample of documents, but an indication of the reliability of this estimate is also required. In this article, we examine several methods for estimating two-tailed recall confidence intervals. We find that the normal approximation in current use provides poor coverage in many circumstances, even when adjusted to correct its inappropriate symmetry. Analytic and Bayesian methods based on the ratio of binomials are generally more accurate but are inaccurate on small populations. The method we recommend derives beta-binomial posteriors on retrieved and unretrieved yield, with fixed hyperparameters, and a Monte Carlo estimate of the posterior distribution of recall. We demonstrate that this method gives mean coverage at or near the nominal level, across several scenarios, while being balanced and stable. We offer advice on sampling design, including the allocation of assessments to the retrieved and unretrieved segments, and compare the proposed beta-binomial with the officially reported normal intervals for recent TREC Legal Track iterations.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Costa:2013:XCA, author = "Gianni Costa and Riccardo Ortale and Ettore Ritacco", title = "{X}-Class: Associative Classification of {XML} Documents by Structure", journal = j-TOIS, volume = "31", number = "1", pages = "3:1--3:??", month = jan, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2414782.2414785", ISSN = "1046-8188", bibdate = "Wed Jan 30 11:36:49 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The supervised classification of XML documents by structure involves learning predictive models in which certain structural regularities discriminate the individual document classes. Hitherto, research has focused on the adoption of prespecified substructures. This is detrimental for classification effectiveness, since the a priori chosen substructures may not accord with the structural properties of the XML documents. Therein, an unexplored question is how to choose the type of structural regularity that best adapts to the structures of the available XML documents. We tackle this problem through X-Class, an approach that handles all types of tree-like substructures and allows for choosing the most discriminatory one. Algorithms are designed to learn compact rule-based classifiers in which the chosen substructures discriminate the classes of XML documents. X-Class is studied across various domains and types of substructures. Its classification performance is compared against several rule-based and SVM-based competitors. Empirical evidence reveals that the classifiers induced by X-Class are compact, scalable, and at least as effective as the established competitors. In particular, certain substructures allow the induction of very compact classifiers that generally outperform the rule-based competitors in terms of effectiveness over all chosen corpora of XML data. Furthermore, such classifiers are substantially as effective as the SVM-based competitor, with the additional advantage of a high-degree of interpretability.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yom-Tov:2013:ESP, author = "Elad Yom-Tov and Fernando Diaz", title = "The Effect of Social and Physical Detachment on Information Need", journal = j-TOIS, volume = "31", number = "1", pages = "4:1--4:??", month = jan, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2414782.2414786", ISSN = "1046-8188", bibdate = "Wed Jan 30 11:36:49 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The information need of users and the documents which answer this need are frequently contingent on the different characteristics of users. This is especially evident during natural disasters, such as earthquakes and violent weather incidents, which create a strong transient information need. In this article, we investigate how the information need of users, as expressed by their queries, is affected by their physical detachment, as estimated by their physical location in relation to that of the event, and by their social detachment, as quantified by the number of their acquaintances who may be affected by the event. Drawing on large-scale data from ten major events, we show that social and physical detachment levels of users are a major influence on their search engine queries. We demonstrate how knowing social and physical detachment levels can assist in improving retrieval for two applications: identifying search queries related to events and ranking results in response to event-related queries. We find that the average precision in identifying relevant search queries improves by approximately 18\%, and that the average precision of ranking that uses detachment information improves by 10\%. Using both types of detachment achieved a larger gain in performance than each of them separately.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2013:RLS, author = "Quan Wang and Jun Xu and Hang Li and Nick Craswell", title = "Regularized Latent Semantic Indexing: a New Approach to Large-Scale Topic Modeling", journal = j-TOIS, volume = "31", number = "1", pages = "5:1--5:??", month = jan, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2414782.2414787", ISSN = "1046-8188", bibdate = "Wed Jan 30 11:36:49 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Topic modeling provides a powerful way to analyze the content of a collection of documents. It has become a popular tool in many research areas, such as text mining, information retrieval, natural language processing, and other related fields. In real-world applications, however, the usefulness of topic modeling is limited due to scalability issues. Scaling to larger document collections via parallelization is an active area of research, but most solutions require drastic steps, such as vastly reducing input vocabulary. In this article we introduce Regularized Latent Semantic Indexing (RLSI)---including a batch version and an online version, referred to as batch RLSI and online RLSI, respectively---to scale up topic modeling. Batch RLSI and online RLSI are as effective as existing topic modeling techniques and can scale to larger datasets without reducing input vocabulary. Moreover, online RLSI can be applied to stream data and can capture the dynamic evolution of topics. Both versions of RLSI formalize topic modeling as a problem of minimizing a quadratic loss function regularized by l1 and/or l2 norm. This formulation allows the learning process to be decomposed into multiple suboptimization problems which can be optimized in parallel, for example, via MapReduce. We particularly propose adopting l1 norm on topics and l2 norm on document representations to create a model with compact and readable topics and which is useful for retrieval. In learning, batch RLSI processes all the documents in the collection as a whole, while online RLSI processes the documents in the collection one by one. We also prove the convergence of the learning of online RLSI. Relevance ranking experiments on three TREC datasets show that batch RLSI and online RLSI perform better than LSI, PLSI, LDA, and NMF, and the improvements are sometimes statistically significant. Experiments on a Web dataset containing about 1.6 million documents and 7 million terms, demonstrate a similar boost in performance.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Xue:2013:MRU, author = "Xiaobing Xue and W. Bruce Croft", title = "Modeling reformulation using query distributions", journal = j-TOIS, volume = "31", number = "2", pages = "6:1--6:??", month = may, year = "2013", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri May 17 19:16:24 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Query reformulation modifies the original query with the aim of better matching the vocabulary of the relevant documents, and consequently improving ranking effectiveness. Previous models typically generate words and phrases related to the original query, but do not consider how these words and phrases would fit together in actual queries. In this article, a novel framework is proposed that models reformulation as a distribution of actual queries, where each query is a variation of the original query. This approach considers an actual query as the basic unit and thus captures important query-level dependencies between words and phrases. An implementation of this framework that only uses publicly available resources is proposed, which makes fair comparisons with other methods using TREC collections possible. Specifically, this implementation consists of a query generation step that analyzes the passages containing query words to generate reformulated queries and a probability estimation step that learns a distribution for reformulated queries by optimizing the retrieval performance. Experiments on TREC collections show that the proposed model can significantly outperform previous reformulation models.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pan:2013:TJE, author = "Sinno Jialin Pan and Zhiqiang Toh and Jian Su", title = "Transfer joint embedding for cross-domain named entity recognition", journal = j-TOIS, volume = "31", number = "2", pages = "7:1--7:??", month = may, year = "2013", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri May 17 19:16:24 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Named Entity Recognition (NER) is a fundamental task in information extraction from unstructured text. Most previous machine-learning-based NER systems are domain-specific, which implies that they may only perform well on some specific domains (e.g., Newswire ) but tend to adapt poorly to other related but different domains (e.g., Weblog ). Recently, transfer learning techniques have been proposed to NER. However, most transfer learning approaches to NER are developed for binary classification, while NER is a multiclass classification problem in nature. Therefore, one has to first reduce the NER task to multiple binary classification tasks and solve them independently. In this article, we propose a new transfer learning method, named Transfer Joint Embedding (TJE), for cross-domain multiclass classification, which can fully exploit the relationships between classes (labels), and reduce domain difference in data distributions for transfer learning. More specifically, we aim to embed both labels (outputs) and high-dimensional features (inputs) from different domains (e.g., a source domain and a target domain) into a unified low-dimensional latent space, where (1) each label is represented by a prototype and the intrinsic relationships between labels can be measured by Euclidean distance; (2) the distance in data distributions between the source and target domains can be reduced; (3) the source domain labeled data are closer to their corresponding label-prototypes than others. After the latent space is learned, classification on the target domain data can be done with the simple nearest neighbor rule in the latent space. Furthermore, in order to scale up TJE, we propose an efficient algorithm based on stochastic gradient descent (SGD). Finally, we apply the proposed TJE method for NER across different domains on the ACE 2005 dataset, which is a benchmark in Natural Language Processing (NLP). Experimental results demonstrate the effectiveness of TJE and show that TJE can outperform state-of-the-art transfer learning approaches to NER.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ke:2013:SCP, author = "Weimao Ke and Javed Mostafa", title = "Studying the clustering paradox and scalability of search in highly distributed environments", journal = j-TOIS, volume = "31", number = "2", pages = "8:1--8:??", month = may, year = "2013", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri May 17 19:16:24 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the ubiquitous production, distribution and consumption of information, today's digital environments such as the Web are increasingly large and decentralized. It is hardly possible to obtain central control over information collections and systems in these environments. Searching for information in these information spaces has brought about problems beyond traditional boundaries of information retrieval (IR) research. This article addresses one important aspect of scalability challenges facing information retrieval models and investigates a decentralized, organic view of information systems pertaining to search in large-scale networks. Drawing on observations from earlier studies, we conduct a series of experiments on decentralized searches in large-scale networked information spaces. Results show that how distributed systems interconnect is crucial to retrieval performance and scalability of searching. Particularly, in various experimental settings and retrieval tasks, we find a consistent phenomenon, namely, the Clustering Paradox, in which the level of network clustering (semantic overlay) imposes a scalability limit. Scalable searches are well supported by a specific, balanced level of network clustering emerging from local system interconnectivity. Departure from that level, either stronger or weaker clustering, leads to search performance degradation, which is dramatic in large-scale networks.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhu:2013:SHF, author = "Xiaofeng Zhu and Zi Huang and Hong Cheng and Jiangtao Cui and Heng Tao Shen", title = "Sparse hashing for fast multimedia search", journal = j-TOIS, volume = "31", number = "2", pages = "9:1--9:??", month = may, year = "2013", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri May 17 19:16:24 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/hash.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Hash-based methods achieve fast similarity search by representing high-dimensional data with compact binary codes. However, both generating binary codes and encoding unseen data effectively and efficiently remain very challenging tasks. In this article, we focus on these tasks to implement approximate similarity search by proposing a novel hash based method named sparse hashing (SH for short). To generate interpretable (or semantically meaningful) binary codes, the proposed SH first converts original data into low-dimensional data through a novel nonnegative sparse coding method. SH then converts the low-dimensional data into Hamming space (i.e., binary encoding low-dimensional data) by a new binarization rule. After this, training data are represented by generated binary codes. To efficiently and effectively encode unseen data, SH learns hash functions by taking a-priori knowledge into account, such as implicit group effect of the features in training data, and the correlations between original space and the learned Hamming space. SH is able to perform fast approximate similarity search by efficient bit XOR operations in the memory of a modern PC with short binary code representations. Experimental results show that the proposed SH significantly outperforms state-of-the-art techniques.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bast:2013:EFS, author = "Hannah Bast and Marjan Celikik", title = "Efficient fuzzy search in large text collections", journal = j-TOIS, volume = "31", number = "2", pages = "10:1--10:??", month = may, year = "2013", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Fri May 17 19:16:24 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/string-matching.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We consider the problem of fuzzy full-text search in large text collections, that is, full-text search which is robust against errors both on the side of the query as well as on the side of the documents. Standard inverted-index techniques work extremely well for ordinary full-text search but fail to achieve interactive query times (below 100 milliseconds) for fuzzy full-text search even on moderately-sized text collections (above 10 GBs of text). We present new preprocessing techniques that achieve interactive query times on large text collections (100 GB of text, served by a single machine). We consider two similarity measures, one where the query terms match similar terms in the collection (e.g., algorithm matches algoritm or vice versa) and one where the query terms match terms with a similar prefix in the collection (e.g., alori matches algorithm). The latter is important when we want to display results instantly after each keystroke (search as you type). All algorithms have been fully integrated into the CompleteSearch engine.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Macdonald:2013:ALM, author = "Craig Macdonald and Rodrygo L. T. Santos and Iadh Ounis and Ben He", title = "About learning models with multiple query-dependent features", journal = j-TOIS, volume = "31", number = "3", pages = "11:1--11:??", month = jul, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2493175.2493176", ISSN = "1046-8188", bibdate = "Wed Jul 31 12:16:17 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Several questions remain unanswered by the existing literature concerning the deployment of query-dependent features within learning to rank. In this work, we investigate three research questions in order to empirically ascertain best practices for learning-to-rank deployments. (i) Previous work in data fusion that pre-dates learning to rank showed that while different retrieval systems could be effectively combined, the combination of multiple models within the same system was not as effective. In contrast, the existing learning-to-rank datasets (e.g., LETOR), often deploy multiple weighting models as query-dependent features within a single system, raising the question as to whether such a combination is needed. (ii) Next, we investigate whether the training of weighting model parameters, traditionally required for effective retrieval, is necessary within a learning-to-rank context. (iii) Finally, we note that existing learning-to-rank datasets use weighting model features calculated on different fields (e.g., title, content, or anchor text), even though such weighting models have been criticized in the literature. Experiments addressing these three questions are conducted on Web search datasets, using various weighting models as query-dependent and typical query-independent features, which are combined using three learning-to-rank techniques. In particular, we show and explain why multiple weighting models should be deployed as features. Moreover, we unexpectedly find that training the weighting model's parameters degrades learned model's effectiveness. Finally, we show that computing a weighting model separately for each field is less effective than more theoretically-sound field-based weighting models.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hou:2013:MPH, author = "Yuexian Hou and Xiaozhao Zhao and Dawei Song and Wenjie Li", title = "Mining pure high-order word associations via information geometry for information retrieval", journal = j-TOIS, volume = "31", number = "3", pages = "12:1--12:??", month = jul, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2493175.2493177", ISSN = "1046-8188", bibdate = "Wed Jul 31 12:16:17 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The classical bag-of-word models for information retrieval (IR) fail to capture contextual associations between words. In this article, we propose to investigate pure high-order dependence among a number of words forming an unseparable semantic entity, that is, the high-order dependence that cannot be reduced to the random coincidence of lower-order dependencies. We believe that identifying these pure high-order dependence patterns would lead to a better representation of documents and novel retrieval models. Specifically, two formal definitions of pure dependence-unconditional pure dependence (UPD) and conditional pure dependence (CPD)-are defined. The exact decision on UPD and CPD, however, is NP-hard in general. We hence derive and prove the sufficient criteria that entail UPD and CPD, within the well-principled information geometry (IG) framework, leading to a more feasible UPD/CPD identification procedure. We further develop novel methods for extracting word patterns with pure high-order dependence. Our methods are applied to and extensively evaluated on three typical IR tasks: text classification and text retrieval without and with query expansion.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Asadi:2013:FCG, author = "Nima Asadi and Jimmy Lin", title = "Fast candidate generation for real-time tweet search with {Bloom} filter chains", journal = j-TOIS, volume = "31", number = "3", pages = "13:1--13:??", month = jul, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2493175.2493178", ISSN = "1046-8188", bibdate = "Wed Jul 31 12:16:17 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The rise of social media and other forms of user-generated content have created the demand for real-time search: against a high-velocity stream of incoming documents, users desire a list of relevant results at the time the query is issued. In the context of real-time search on tweets, this work explores candidate generation in a two-stage retrieval architecture where an initial list of results is processed by a second-stage rescorer to produce the final output. We introduce Bloom filter chains, a novel extension of Bloom filters that can dynamically expand to efficiently represent an arbitrarily long and growing list of monotonically-increasing integers with a constant false positive rate. Using a collection of Bloom filter chains, a novel approximate candidate generation algorithm called BWand is able to perform both conjunctive and disjunctive retrieval. Experiments show that our algorithm is many times faster than competitive baselines and that this increased performance does not require sacrificing end-to-end effectiveness. Our results empirically characterize the trade-off space defined by output quality, query evaluation speed, and memory footprint for this particular search architecture.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lucchese:2013:DTS, author = "Claudio Lucchese and Salvatore Orlando and Raffaele Perego and Fabrizio Silvestri and Gabriele Tolomei", title = "Discovering tasks from search engine query logs", journal = j-TOIS, volume = "31", number = "3", pages = "14:1--14:??", month = jul, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2493175.2493179", ISSN = "1046-8188", bibdate = "Wed Jul 31 12:16:17 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Although Web search engines still answer user queries with lists of ten blue links to webpages, people are increasingly issuing queries to accomplish their daily tasks (e.g., finding a recipe, booking a flight, reading online news, etc.). In this work, we propose a two-step methodology for discovering tasks that users try to perform through search engines. First, we identify user tasks from individual user sessions stored in search engine query logs. In our vision, a user task is a set of possibly noncontiguous queries (within a user search session), which refer to the same need. Second, we discover collective tasks by aggregating similar user tasks, possibly performed by distinct users. To discover user tasks, we propose query similarity functions based on unsupervised and supervised learning approaches. We present a set of query clustering methods that exploit these functions in order to detect user tasks. All the proposed solutions were evaluated on a manually-built ground truth, and two of them performed better than state-of-the-art approaches. To detect collective tasks, we propose four methods that cluster previously discovered user tasks, which in turn are represented by the bag-of-words extracted from their composing queries. These solutions were also evaluated on another manually-built ground truth.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nong:2013:PLT, author = "Ge Nong", title = "Practical linear-time {$ O(1) $}-workspace suffix sorting for constant alphabets", journal = j-TOIS, volume = "31", number = "3", pages = "15:1--15:??", month = jul, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2493175.2493180", ISSN = "1046-8188", bibdate = "Wed Jul 31 12:16:17 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article presents an {$ O(n) $}-time algorithm called SACA-K for sorting the suffixes of an input string {$ T[0, n - 1] $} over an alphabet {$ A[0, K - 1] $}. The problem of sorting the suffixes of {$T$} is also known as constructing the suffix array (SA) for {$T$}. The theoretical memory usage of SACA-{$K$} is {$ n \log K + n \log n + K \log n $} bits. Moreover, we also have a practical implementation for SACA-{$K$} that uses $n$ bytes + $ (n + 256) $ words and is suitable for strings over any alphabet up to full ASCII, where a word is $ \log n $ bits. In our experiment, SACA-{$K$} outperforms SA-IS that was previously the most time- and space-efficient linear-time SA construction algorithm (SACA). SACA-{$K$} is around 33\% faster and uses a smaller deterministic workspace of {$K$} words, where the workspace is the space needed beyond the input string and the output SA. Given {$ K = O(1) $}, SACA-{$K$} runs in linear time and {$ O(1) $} workspace. To the best of our knowledge, such a result is the first reported in the literature with a practical source code publicly available.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Radinsky:2013:BDW, author = "Kira Radinsky and Krysta M. Svore and Susan T. Dumais and Milad Shokouhi and Jaime Teevan and Alex Bocharov and Eric Horvitz", title = "Behavioral dynamics on the {Web}: Learning, modeling, and prediction", journal = j-TOIS, volume = "31", number = "3", pages = "16:1--16:??", month = jul, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2493175.2493181", ISSN = "1046-8188", bibdate = "Wed Jul 31 12:16:17 MDT 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The queries people issue to a search engine and the results clicked following a query change over time. For example, after the earthquake in Japan in March 2011, the query {\em Japan\/} spiked in popularity and people issuing the query were more likely to click government-related results than they would prior to the earthquake. We explore the modeling and prediction of such temporal patterns in Web search behavior. We develop a temporal modeling framework adapted from physics and signal processing and harness it to predict temporal patterns in search behavior using smoothing, trends, periodicities, and surprises. Using current and past behavioral data, we develop a learning procedure that can be used to construct models of users' Web search activities. We also develop a novel methodology that learns to select the best prediction model from a family of predictive models for a given query or a class of queries. Experimental results indicate that the predictive models significantly outperform baseline models that weight historical evidence the same for all queries. We present two applications where new methods introduced for the temporal modeling of user behavior significantly improve upon the state of the art. Finally, we discuss opportunities for using models of temporal dynamics to enhance other areas of Web search and information retrieval.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hofmann:2013:FSE, author = "Katja Hofmann and Shimon Whiteson and Maarten {De Rijke}", title = "Fidelity, Soundness, and Efficiency of Interleaved Comparison Methods", journal = j-TOIS, volume = "31", number = "4", pages = "17:1--17:??", month = nov, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2536736.2536737", ISSN = "1046-8188", bibdate = "Tue Dec 3 18:39:19 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Ranker evaluation is central to the research into search engines, be it to compare rankers or to provide feedback for learning to rank. Traditional evaluation approaches do not scale well because they require explicit relevance judgments of document-query pairs, which are expensive to obtain. A promising alternative is the use of interleaved comparison methods, which compare rankers using click data obtained when interleaving their rankings. In this article, we propose a framework for analyzing interleaved comparison methods. An interleaved comparison method has fidelity if the expected outcome of ranker comparisons properly corresponds to the true relevance of the ranked documents. It is sound if its estimates of that expected outcome are unbiased and consistent. It is efficient if those estimates are accurate with only little data. We analyze existing interleaved comparison methods and find that, while sound, none meet our criteria for fidelity. We propose a probabilistic interleave method, which is sound and has fidelity. We show empirically that, by marginalizing out variables that are known, it is more efficient than existing interleaved comparison methods. Using importance sampling we derive a sound extension that is able to reuse historical data collected in previous comparisons of other ranker pairs.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Paik:2013:ERQ, author = "Jiaul H. Paik and Swapan K. Parui and Dipasree Pal and Stephen E. Robertson", title = "Effective and Robust Query-Based Stemming", journal = j-TOIS, volume = "31", number = "4", pages = "18:1--18:??", month = nov, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2536736.2536738", ISSN = "1046-8188", bibdate = "Tue Dec 3 18:39:19 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Stemming is a widely used technique in information retrieval systems to address the vocabulary mismatch problem arising out of morphological phenomena. The major shortcoming of the commonly used stemmers is that they accept the morphological variants of the query words without considering their thematic coherence with the given query, which leads to poor performance. Moreover, for many queries, such approaches also produce retrieval performance that is poorer than no stemming, thereby degrading the robustness. The main goal of this article is to present corpus-based fully automatic stemming algorithms which address these issues. A set of experiments on six TREC collections and three other non-English collections containing news and web documents shows that the proposed query-based stemming algorithms consistently and significantly outperform four state of the art strong stemmers of completely varying principles. Our experiments also confirm that the robustness of the proposed query-based stemming algorithms are remarkably better than the existing strong baselines.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Esuli:2013:ITC, author = "Andrea Esuli and Fabrizio Sebastiani", title = "Improving Text Classification Accuracy by Training Label Cleaning", journal = j-TOIS, volume = "31", number = "4", pages = "19:1--19:??", month = nov, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2516889", ISSN = "1046-8188", bibdate = "Tue Dec 3 18:39:19 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In text classification (TC) and other tasks involving supervised learning, labelled data may be scarce or expensive to obtain. Semisupervised learning and active learning are two strategies whose aim is maximizing the effectiveness of the resulting classifiers for a given amount of training effort. Both strategies have been actively investigated for TC in recent years. Much less research has been devoted to a third such strategy, training label cleaning (TLC), which consists in devising ranking functions that sort the original training examples in terms of how likely it is that the human annotator has mislabelled them. This provides a convenient means for the human annotator to revise the training set so as to improve its quality. Working in the context of boosting-based learning methods for multilabel classification we present three different techniques for performing TLC and, on three widely used TC benchmarks, evaluate them by their capability of spotting training documents that, for experimental reasons only, we have purposefully mislabelled. We also evaluate the degradation in classification effectiveness that these mislabelled texts bring about, and to what extent training label cleaning can prevent this degradation.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chelmis:2013:SLP, author = "Charalampos Chelmis and Viktor K. Prasanna", title = "Social Link Prediction in Online Social Tagging Systems", journal = j-TOIS, volume = "31", number = "4", pages = "20:1--20:??", month = nov, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2516891", ISSN = "1046-8188", bibdate = "Tue Dec 3 18:39:19 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Social networks have become a popular medium for people to communicate and distribute ideas, content, news, and advertisements. Social content annotation has naturally emerged as a method of categorization and filtering of online information. The unrestricted vocabulary users choose from to annotate content has often lead to an explosion of the size of space in which search is performed. In this article, we propose latent topic models as a principled way of reducing the dimensionality of such data and capturing the dynamics of collaborative annotation process. We propose three generative processes to model latent user tastes with respect to resources they annotate with metadata. We show that latent user interests combined with social clues from the immediate neighborhood of users can significantly improve social link prediction in the online music social media site Last.fm. Most link prediction methods suffer from the high class imbalance problem, resulting in low precision and/or recall. In contrast, our proposed classification schemes for social link recommendation achieve high precision and recall with respect to not only the dominant class (nonexistence of a link), but also with respect to sparse positive instances, which are the most vital in social tie prediction.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Jia:2013:ISD, author = "Lifeng Jia and Clement Yu and Weiyi Meng", title = "The Impacts of Structural Difference and Temporality of Tweets on Retrieval Effectiveness", journal = j-TOIS, volume = "31", number = "4", pages = "21:1--21:??", month = nov, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2500751", ISSN = "1046-8188", bibdate = "Tue Dec 3 18:39:19 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "To explore the information seeking behaviors in microblogosphere, the microblog track at TREC 2011 introduced a real-time ad-hoc retrieval task that aims at ranking relevant tweets in reverse-chronological order. We study this problem via a two-phase approach: (1) retrieving tweets in an ad-hoc way; (2) utilizing the temporal information of tweets to enhance the retrieval effectiveness of tweets. Tweets can be categorized into two types. One type consists of short messages not containing any URL of a Web page. The other type has at least one URL of a Web page in addition to a short message. These two types of tweets have different structures. In the first phase, to address the structural difference of tweets, we propose a method to rank tweets using the divide-and-conquer strategy. Specifically, we first rank the two types of tweets separately. This produces two rankings, one for each type. Then we merge these two rankings of tweets into one ranking. In the second phase, we first categorize queries into several types by exploring the temporal distributions of their top-retrieved tweets from the first phase; then we calculate the time-related relevance scores of tweets according to the classified types of queries; finally we combine the time scores with the IR scores from the first phase to produce a ranking of tweets. Experimental results achieved by using the TREC 2011 and TREC 2012 queries over the TREC Tweets2011 collection show that: (i) our way of ranking the two types of tweets separately and then merging them together yields better retrieval effectiveness than ranking them simultaneously; (ii) our way of incorporating temporal information into the retrieval process yields further improvements, and (iii) our method compares favorably with state-of-the-art methods in retrieval effectiveness.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chiu:2013:EVS, author = "Chih-Yi Chiu and Tsung-Han Tsai and Guei-Wun Han and Cheng-Yu Hsieh and Sheng-Yang Li", title = "Efficient Video Stream Monitoring for Near-Duplicate Detection and Localization in a Large-Scale Repository", journal = j-TOIS, volume = "31", number = "4", pages = "22:1--22:??", month = nov, year = "2013", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2516890", ISSN = "1046-8188", bibdate = "Tue Dec 3 18:39:19 MST 2013", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In this article, we study the efficiency problem of video stream near-duplicate monitoring in a large-scale repository. Existing stream monitoring methods are mainly designed for a short video to scan over a query stream; they have difficulty being scalable for a large number of long videos. We present a simple but effective algorithm called incremental similarity update to address the problem. That is, a similarity upper bound between two videos can be calculated incrementally by leveraging the prior knowledge of the previous calculation. The similarity upper bound takes a lightweight computation to filter out unnecessary time-consuming computation for the actual similarity between two videos, making the search process more efficient. We integrate the algorithm with inverted indexing to obtain a candidate list from the repository for the given query stream. Meanwhile, the algorithm is applied to scan each candidate for locating exact near-duplicate subsequences. We implement several state-of-the-art methods for comparison in terms of accuracy, execution time, and memory consumption. Experimental results demonstrate the proposed algorithm yields comparable accuracy, compact memory size, and more efficient execution time.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nong:2014:SAC, author = "Ge Nong and Wai Hong Chan and Sen Zhang and Xiao Feng Guan", title = "Suffix Array Construction in External Memory Using {D}-Critical Substrings", journal = j-TOIS, volume = "32", number = "1", pages = "1:1--1:??", month = jan, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2518175", ISSN = "1046-8188", bibdate = "Tue Jan 28 17:40:54 MST 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present a new suffix array construction algorithm that aims to build, in external memory, the suffix array for an input string of length n measured in the magnitude of tens of Giga characters over a constant or integer alphabet. The core of this algorithm is adapted from the framework of the original internal memory SA-DS algorithm that samples fixed-size $d$-critical substrings. This new external-memory algorithm, called EM-SA-DS, uses novel cache data structures to construct a suffix array in a sequential scanning manner with good data spatial locality: data is read from or written to disk sequentially. On the assumed external-memory model with RAM capacity $ \Omega ((n B)^{0.5}) $, disk capacity $ O(n) $, and size of each I/O block B, all measured in $ \log n $-bit words, the I/O complexity of EM-SA-DS is $ O(n / B) $. This work provides a general cache-based solution that could be further exploited to develop external-memory solutions for other suffix-array-related problems, for example, computing the longest-common-prefix array, using a modern personal computer with a typical memory configuration of 4GB RAM and a single disk.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cummins:2014:DSD, author = "Ronan Cummins", title = "Document Score Distribution Models for Query Performance Inference and Prediction", journal = j-TOIS, volume = "32", number = "1", pages = "2:1--2:??", month = jan, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2559170", ISSN = "1046-8188", bibdate = "Tue Jan 28 17:40:54 MST 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Modelling the distribution of document scores returned from an information retrieval (IR) system in response to a query is of both theoretical and practical importance. One of the goals of modelling document scores in this manner is the inference of document relevance. There has been renewed interest of late in modelling document scores using parameterised distributions. Consequently, a number of hypotheses have been proposed to constrain the mixture distribution from which document scores could be drawn. In this article, we show how a standard performance measure (i.e., average precision) can be inferred from a document score distribution using labelled data. We use the accuracy of the inference of average precision as a measure for determining the usefulness of a particular model of document scores. We provide a comprehensive study which shows that certain mixtures of distributions are able to infer average precision more accurately than others. Furthermore, we analyse a number of mixture distributions with regard to the recall-fallout convexity hypothesis and show that the convexity hypothesis is practically useful. Consequently, based on one of the best-performing score-distribution models, we develop some techniques for query-performance prediction (QPP) by automatically estimating the parameters of the document score-distribution model when relevance information is unknown. We present experimental results that outline the benefits of this approach to query-performance prediction.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Huston:2014:IWS, author = "Samuel Huston and J. Shane Culpepper and W. Bruce Croft", title = "Indexing Word Sequences for Ranked Retrieval", journal = j-TOIS, volume = "32", number = "1", pages = "3:1--3:??", month = jan, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2559168", ISSN = "1046-8188", bibdate = "Tue Jan 28 17:40:54 MST 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Formulating and processing phrases and other term dependencies to improve query effectiveness is an important problem in information retrieval. However, accessing word-sequence statistics using inverted indexes requires unreasonable processing time or substantial space overhead. Establishing a balance between these competing space and time trade-offs can dramatically improve system performance. In this article, we present and analyze a new index structure designed to improve query efficiency in dependency retrieval models. By adapting a class of $ (\epsilon, \delta) $-approximation algorithms originally proposed for sketch summarization in networking applications, we show how to accurately estimate statistics important in term-dependency models with low, probabilistically bounded error rates. The space requirements for the vocabulary of the index is only logarithmically linked to the size of the vocabulary. Empirically, we show that the sketch index can reduce the space requirements of the vocabulary component of an index of n -grams consisting of between 1 and 4 words extracted from the GOV2 collection to less than 0.01\% of the space requirements of the vocabulary of a full index. We also show that larger $n$-gram queries can be processed considerably more efficiently than in current alternatives, such as positional and next-word indexes.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ge:2014:CAC, author = "Yong Ge and Hui Xiong and Alexander Tuzhilin and Qi Liu", title = "Cost-Aware Collaborative Filtering for Travel Tour Recommendations", journal = j-TOIS, volume = "32", number = "1", pages = "4:1--4:??", month = jan, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2559169", ISSN = "1046-8188", bibdate = "Tue Jan 28 17:40:54 MST 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Advances in tourism economics have enabled us to collect massive amounts of travel tour data. If properly analyzed, this data could be a source of rich intelligence for providing real-time decision making and for the provision of travel tour recommendations. However, tour recommendation is quite different from traditional recommendations, because the tourist's choice is affected directly by the travel costs, which includes both financial and time costs. To that end, in this article, we provide a focused study of cost-aware tour recommendation. Along this line, we first propose two ways to represent user cost preference. One way is to represent user cost preference by a two-dimensional vector. Another way is to consider the uncertainty about the cost that a user can afford and introduce a Gaussian prior to model user cost preference. With these two ways of representing user cost preference, we develop different cost-aware latent factor models by incorporating the cost information into the probabilistic matrix factorization (PMF) model, the logistic probabilistic matrix factorization (LPMF) model, and the maximum margin matrix factorization (MMMF) model, respectively. When applied to real-world travel tour data, all the cost-aware recommendation models consistently outperform existing latent factor models with a significant margin.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nie:2014:LRD, author = "Liqiang Nie and Yi-Liang Zhao and Xiangyu Wang and Jialie Shen and Tat-Seng Chua", title = "Learning to Recommend Descriptive Tags for Questions in Social Forums", journal = j-TOIS, volume = "32", number = "1", pages = "5:1--5:??", month = jan, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2559157", ISSN = "1046-8188", bibdate = "Tue Jan 28 17:40:54 MST 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Around 40\% of the questions in the emerging social-oriented question answering forums have at most one manually labeled tag, which is caused by incomprehensive question understanding or informal tagging behaviors. The incompleteness of question tags severely hinders all the tag-based manipulations, such as feeds for topic-followers, ontological knowledge organization, and other basic statistics. This article presents a novel scheme that is able to comprehensively learn descriptive tags for each question. Extensive evaluations on a representative real-world dataset demonstrate that our scheme yields significant gains for question annotation, and more importantly, the whole process of our approach is unsupervised and can be extended to handle large-scale data.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bast:2014:EIB, author = "Hannah Bast and Marjan Celikik", title = "Efficient Index-Based Snippet Generation", journal = j-TOIS, volume = "32", number = "2", pages = "6:1--6:??", month = apr, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2590972", ISSN = "1046-8188", bibdate = "Tue Apr 22 17:59:17 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Ranked result lists with query-dependent snippets have become state of the art in text search. They are typically implemented by searching, at query time, for occurrences of the query words in the top-ranked documents. This document-based approach has three inherent problems: (i) when a document is indexed by terms which it does not contain literally (e.g., related words or spelling variants), localization of the corresponding snippets becomes problematic; (ii) each query operator (e.g., phrase or proximity search) has to be implemented twice, on the index side in order to compute the correct result set, and on the snippet-generation side to generate the appropriate snippets; and (iii) in a worst case, the whole document needs to be scanned for occurrences of the query words, which could be problematic for very long documents. We present a new index-based method that localizes snippets by information solely computed from the index and that overcomes all three problems. Unlike previous index-based methods, we show how to achieve this at essentially no extra cost in query processing time, by a technique we call operator inversion. We also show how our index-based method allows the caching of individual segments instead of complete documents, which enables a significantly larger cache hit-ratio as compared to the document-based approach. We have fully integrated our implementation with the CompleteSearch engine.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhao:2014:MTA, author = "Jiashu Zhao and Jimmy Xiangji Huang and Zheng Ye", title = "Modeling Term Associations for Probabilistic Information Retrieval", journal = j-TOIS, volume = "32", number = "2", pages = "7:1--7:??", month = apr, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2590988", ISSN = "1046-8188", bibdate = "Tue Apr 22 17:59:17 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Traditionally, in many probabilistic retrieval models, query terms are assumed to be independent. Although such models can achieve reasonably good performance, associations can exist among terms from a human being's point of view. There are some recent studies that investigate how to model term associations/dependencies by proximity measures. However, the modeling of term associations theoretically under the probabilistic retrieval framework is still largely unexplored. In this article, we introduce a new concept cross term, to model term proximity, with the aim of boosting retrieval performance. With cross terms, the association of multiple query terms can be modeled in the same way as a simple unigram term. In particular, an occurrence of a query term is assumed to have an impact on its neighboring text. The degree of the query-term impact gradually weakens with increasing distance from the place of occurrence. We use shape functions to characterize such impacts. Based on this assumption, we first propose a bigram CRoss TErm Retrieval ( CRTER$_2$ ) model as the basis model, and then recursively propose a generalized n-gram CRoss TErm Retrieval ( CRTER$_n$ ) model for n query terms, where n {$>$} 2. Specifically, a bigram cross term occurs when the corresponding query terms appear close to each other, and its impact can be modeled by the intersection of the respective shape functions of the query terms. For an n-gram cross term, we develop several distance metrics with different properties and employ them in the proposed models for ranking. We also show how to extend the language model using the newly proposed cross terms. Extensive experiments on a number of TREC collections demonstrate the effectiveness of our proposed models.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cui:2014:SSI, author = "Peng Cui and Shao-Wei Liu and Wen-Wu Zhu and Huan-Bo Luan and Tat-Seng Chua and Shi-Qiang Yang", title = "Social-Sensed Image Search", journal = j-TOIS, volume = "32", number = "2", pages = "8:1--8:??", month = apr, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2590974", ISSN = "1046-8188", bibdate = "Tue Apr 22 17:59:17 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Although Web search techniques have greatly facilitate users' information seeking, there are still quite a lot of search sessions that cannot provide satisfactory results, which are more serious in Web image search scenarios. How to understand user intent from observed data is a fundamental issue and of paramount significance in improving image search performance. Previous research efforts mostly focus on discovering user intent either from clickthrough behavior in user search logs (e.g., Google), or from social data to facilitate vertical image search in a few limited social media platforms (e.g., Flickr). This article aims to combine the virtues of these two information sources to complement each other, that is, sensing and understanding users' interests from social media platforms and transferring this knowledge to rerank the image search results in general image search engines. Toward this goal, we first propose a novel social-sensed image search framework, where both social media and search engine are jointly considered. To effectively and efficiently leverage these two kinds of platforms, we propose an example-based user interest representation and modeling method, where we construct a hybrid graph from social media and propose a hybrid random-walk algorithm to derive the user-image interest graph. Moreover, we propose a social-sensed image reranking method to integrate the user-image interest graph from social media and search results from general image search engines to rerank the images by fusing their social relevance and visual relevance. We conducted extensive experiments on real-world data from Flickr and Google image search, and the results demonstrated that the proposed methods can significantly improve the social relevance of image search results while maintaining visual relevance well.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Markov:2014:TQQ, author = "Ilya Markov and Fabio Crestani", title = "Theoretical, Qualitative, and Quantitative Analyses of Small-Document Approaches to Resource Selection", journal = j-TOIS, volume = "32", number = "2", pages = "9:1--9:??", month = apr, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2590975", ISSN = "1046-8188", bibdate = "Tue Apr 22 17:59:17 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In a distributed retrieval setup, resource selection is the problem of identifying and ranking relevant sources of information for a given user's query. For better usage of existing resource-selection techniques, it is desirable to know what the fundamental differences between them are and in what settings one is superior to others. However, little is understood still about the actual behavior of resource-selection methods. In this work, we focus on small-document approaches to resource selection that rank and select sources based on the ranking of their documents. We pose a number of research questions and approach them by three types of analyses. First, we present existing small-document techniques in a unified framework and analyze them theoretically. Second, we propose using a qualitative analysis to study the behavior of different small-document approaches. Third, we present a novel experimental methodology to evaluate small-document techniques and to validate the results of the qualitative analysis. This way, we answer the posed research questions and provide insights about small-document methods in general and about each technique in particular.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Skaggs:2014:TMW, author = "Bradley Skaggs and Lise Getoor", title = "Topic Modeling for {Wikipedia} Link Disambiguation", journal = j-TOIS, volume = "32", number = "3", pages = "10:1--10:??", month = jun, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2633044", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:20:38 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Many articles in the online encyclopedia Wikipedia have hyperlinks to ambiguous article titles; these ambiguous links should be replaced with links to unambiguous articles, a process known as disambiguation. We propose a novel statistical topic model based on link text, which we refer to as the Link Text Topic Model (LTTM), that we use to suggest new link targets for ambiguous links. To evaluate our model, we describe a method for extracting ground truth for this link disambiguation task from edits made to Wikipedia in a specific time period. We use this ground truth to demonstrate the superiority of LTTM over other existing link- and content-based approaches to disambiguating links in Wikipedia. Finally, we build a web service that uses LTTM to make suggestions to human editors wanting to fix ambiguous links in Wikipedia.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yin:2014:LSI, author = "Hongzhi Yin and Bin Cui and Yizhou Sun and Zhiting Hu and Ling Chen", title = "{LCARS}: a Spatial Item Recommender System", journal = j-TOIS, volume = "32", number = "3", pages = "11:1--11:??", month = jun, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2629461", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:20:38 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Newly emerging location-based and event-based social network services provide us with a new platform to understand users' preferences based on their activity history. A user can only visit a limited number of venues/events and most of them are within a limited distance range, so the user-item matrix is very sparse, which creates a big challenge to the traditional collaborative filtering-based recommender systems. The problem becomes even more challenging when people travel to a new city where they have no activity information. In this article, we propose LCARS, a location-content-aware recommender system that offers a particular user a set of venues (e.g., restaurants and shopping malls) or events (e.g., concerts and exhibitions) by giving consideration to both personal interest and local preference. This recommender system can facilitate people's travel not only near the area in which they live, but also in a city that is new to them. Specifically, LCARS consists of two components: offline modeling and online recommendation. The offline modeling part, called LCA-LDA, is designed to learn the interest of each individual user and the local preference of each individual city by capturing item cooccurrence patterns and exploiting item contents. The online recommendation part takes a querying user along with a querying city as input, and automatically combines the learned interest of the querying user and the local preference of the querying city to produce the top- k recommendations. To speed up the online process, a scalable query processing technique is developed by extending both the Threshold Algorithm (TA) and TA-approximation algorithm. We evaluate the performance of our recommender system on two real datasets, that is, DoubanEvent and Foursquare, and one large-scale synthetic dataset. The results show the superiority of LCARS in recommending spatial items for users, especially when traveling to new cities, in terms of both effectiveness and efficiency. Besides, the experimental analysis results also demonstrate the excellent interpretability of LCARS.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Laere:2014:GWD, author = "Olivier {Van Laere} and Steven Schockaert and Vlad Tanasescu and Bart Dhoedt and Christopher B. Jones", title = "Georeferencing {Wikipedia} Documents Using Data from Social Media Sources", journal = j-TOIS, volume = "32", number = "3", pages = "12:1--12:??", month = jun, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2629685", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:20:38 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Social media sources such as Flickr and Twitter continuously generate large amounts of textual information (tags on Flickr and short messages on Twitter). This textual information is increasingly linked to geographical coordinates, which makes it possible to learn how people refer to places by identifying correlations between the occurrence of terms and the locations of the corresponding social media objects. Recent work has focused on how this potentially rich source of geographic information can be used to estimate geographic coordinates for previously unseen Flickr photos or Twitter messages. In this article, we extend this work by analysing to what extent probabilistic language models trained on Flickr and Twitter can be used to assign coordinates to Wikipedia articles. Our results show that exploiting these language models substantially outperforms both (i) classical gazetteer-based methods (in particular, using Yahoo! Placemaker and Geonames) and (ii) language modelling approaches trained on Wikipedia alone. This supports the hypothesis that social media are important sources of geographic information, which are valuable beyond the scope of individual applications.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Brisaboa:2014:XEX, author = "Nieves R. Brisaboa and Ana Cerdeira-Pena and Gonzalo Navarro", title = "{XXS}: Efficient {XPath} Evaluation on Compressed {XML} Documents", journal = j-TOIS, volume = "32", number = "3", pages = "13:1--13:??", month = jun, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2629554", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:20:38 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The eXtensible Markup Language (XML) is acknowledged as the de facto standard for semistructured data representation and data exchange on the Web and many other scenarios. A well-known shortcoming of XML is its verbosity, which increases manipulation, transmission, and processing costs. Various structure-blind and structure-conscious compression techniques can be applied to XML, and some are even access-friendly, meaning that the documents can be efficiently accessed in compressed form. Direct access is necessary to implement the query languages XPath and XQuery, which are the standard ones to exploit the expressiveness of XML. While a good deal of theoretical and practical proposals exist to solve XPath/XQuery operations on XML, only a few ones are well integrated with a compression format that supports the required access operations on the XML data. In this work we go one step further and design a compression format for XML collections that boosts the performance of XPath queries on the data. This is done by designing compressed representations of the XML data that support some complex operations apart from just accessing the data, and those are exploited to solve key components of the XPath queries. Our system, called XXS, is aimed at XML collections containing natural language text, which are compressed to within 35\%--50\% of their original size while supporting a large subset of XPath operations in time competitive with, and many times outperforming, the best state-of-the-art systems that work on uncompressed representations.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Awad:2014:CBV, author = "George Awad and Paul Over and Wessel Kraaij", title = "Content-Based Video Copy Detection Benchmarking at {TRECVID}", journal = j-TOIS, volume = "32", number = "3", pages = "14:1--14:??", month = jun, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2629531", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:20:38 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article presents an overview of the video copy detection benchmark which was run over a period of 4 years (2008--2011) as part of the TREC Video Retrieval (TRECVID) workshop series. The main contributions of the article include (i) an examination of the evolving design of the evaluation framework and its components (system tasks, data, measures); (ii) a high-level overview of results and best-performing approaches; and (iii) a discussion of lessons learned over the four years. The content-based copy detection (CCD) benchmark worked with a large collection of synthetic queries, which is atypical for TRECVID, as was the use of a normalized detection cost framework. These particular evaluation design choices are motivated and appraised.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2014:TPB, author = "Richong Zhang and Yongyi Mao", title = "Trust Prediction via Belief Propagation", journal = j-TOIS, volume = "32", number = "3", pages = "15:1--15:??", month = jun, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2629530", ISSN = "1046-8188", bibdate = "Wed Jul 16 17:20:38 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The prediction of trust relationships in social networks plays an important role in the analytics of the networks. Although various link prediction algorithms for general networks may be adapted for this purpose, the recent notion of ``trust propagation'' has been shown to effectively capture the trust-formation mechanisms and resulted in an effective prediction algorithm. This article builds on the concept of trust propagation and presents a probabilistic trust propagation model. Our model exploits the modern framework of probabilistic graphical models, more specifically, factor graphs. Under this model, the trust prediction problem can be formulated as a statistical inference problem and we derive the belief propagation algorithm as a solver for trust prediction. The model and algorithm are tested using datasets from Epinions and Ciao, by which performance advantages over the previous algorithms are demonstrated.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Mahdabi:2014:PQF, author = "Parvaz Mahdabi and Fabio Crestani", title = "Patent Query Formulation by Synthesizing Multiple Sources of Relevance Evidence", journal = j-TOIS, volume = "32", number = "4", pages = "16:1--16:??", month = oct, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2651363", ISSN = "1046-8188", bibdate = "Tue Oct 28 16:57:21 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Patent prior art search is a task in patent retrieval with the goal of finding documents which describe prior art work related to a query patent. A query patent is a full patent application composed of hundreds of terms which does not represent a single focused information need. Fortunately, other relevance evidence sources (i.e., classification tags and bibliographical data) provide additional details about the underlying information need. In this article, we propose a unified framework that integrates multiple relevance evidence components for query formulation. We first build a query model from the textual fields of a query patent. To overcome the term mismatch, we expand this initial query model with the term distribution of documents in the citation graph, modeling old and recent domain terminology. We build an IPC lexicon and perform query expansion using this lexicon incorporating proximity information. We performed an empirical evaluation on two patent datasets. Our results show that employing the temporal features of documents has a precision enhancing effect, while query expansion using IPC lexicon improves the recall of the final rank list.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Forsati:2014:MFE, author = "Rana Forsati and Mehrdad Mahdavi and Mehrnoush Shamsfard and Mohamed Sarwat", title = "Matrix Factorization with Explicit Trust and Distrust Side Information for Improved Social Recommendation", journal = j-TOIS, volume = "32", number = "4", pages = "17:1--17:??", month = oct, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2641564", ISSN = "1046-8188", bibdate = "Tue Oct 28 16:57:21 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the advent of online social networks, recommender systems have became crucial for the success of many online applications/services due to their significance role in tailoring these applications to user-specific needs or preferences. Despite their increasing popularity, in general, recommender systems suffer from data sparsity and cold-start problems. To alleviate these issues, in recent years, there has been an upsurge of interest in exploiting social information such as trust relations among users along with the rating data to improve the performance of recommender systems. The main motivation for exploiting trust information in the recommendation process stems from the observation that the ideas we are exposed to and the choices we make are significantly influenced by our social context. However, in large user communities, in addition to trust relations, distrust relations also exist between users. For instance, in Epinions, the concepts of personal ``web of trust'' and personal ``block list'' allow users to categorize their friends based on the quality of reviews into trusted and distrusted friends, respectively. Hence, it will be interesting to incorporate this new source of information in recommendation as well. In contrast to the incorporation of trust information in recommendation which is thriving, the potential of explicitly incorporating distrust relations is almost unexplored. In this article, we propose a matrix factorization-based model for recommendation in social rating networks that properly incorporates both trust and distrust relationships aiming to improve the quality of recommendations and mitigate the data sparsity and cold-start users issues. Through experiments on the Epinions dataset, we show that our new algorithm outperforms its standard trust-enhanced or distrust-enhanced counterparts with respect to accuracy, thereby demonstrating the positive effect that incorporation of explicit distrust information can have on recommender systems.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lu:2014:BSI, author = "Shiyang Lu and Tao Mei and Jingdong Wang and Jian Zhang and Zhiyong Wang and Shipeng Li", title = "Browse-to-Search: Interactive Exploratory Search with Visual Entities", journal = j-TOIS, volume = "32", number = "4", pages = "18:1--18:??", month = oct, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2630420", ISSN = "1046-8188", bibdate = "Tue Oct 28 16:57:21 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the development of image search technology, users are no longer satisfied with searching for images using just metadata and textual descriptions. Instead, more search demands are focused on retrieving images based on similarities in their contents (textures, colors, shapes etc.). Nevertheless, one image may deliver rich or complex content and multiple interests. Sometimes users do not sufficiently define or describe their seeking demands for images even when general search interests appear, owing to a lack of specific knowledge to express their intents. A new form of information seeking activity, referred to as exploratory search, is emerging in the research community, which generally combines browsing and searching content together to help users gain additional knowledge and form accurate queries, thereby assisting the users with their seeking and investigation activities. However, there have been few attempts at addressing integrated exploratory search solutions when image browsing is incorporated into the exploring loop. In this work, we investigate the challenges of understanding users' search interests from the images being browsed and infer their actual search intentions. We develop a novel system to explore an effective and efficient way for allowing users to seamlessly switch between browse and search processes, and naturally complete visual-based exploratory search tasks. The system, called Browse-to-Search enables users to specify their visual search interests by circling any visual objects in the webpages being browsed, and then the system automatically forms the visual entities to represent users' underlying intent. One visual entity is not limited by the original image content, but also encapsulated by the textual-based browsing context and the associated heterogeneous attributes. We use large-scale image search technology to find the associated textual attributes from the repository. Users can then utilize the encapsulated visual entities to complete search tasks. The Browse-to-Search system is one of the first attempts to integrate browse and search activities for a visual-based exploratory search, which is characterized by four unique properties: (1) in session-searching is performed during browsing session and search results naturally accompany with browsing content; (2) in context-the pages being browsed provide text-based contextual cues for searching; (3) in focus-users can focus on the visual content of interest without worrying about the difficulties of query formulation, and visual entities will be automatically formed; and (4) intuitiveness-a touch and visual search-based user interface provides a natural user experience. We deploy the Browse-to-Search system on tablet devices and evaluate the system performance using millions of images. We demonstrate that it is effective and efficient in facilitating the user's exploratory search compared to the conventional image search methods and, more importantly, provides users with more robust results to satisfy their exploring experience.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ture:2014:ERS, author = "Ferhan Ture and Jimmy Lin", title = "Exploiting Representations from Statistical Machine Translation for Cross-Language Information Retrieval", journal = j-TOIS, volume = "32", number = "4", pages = "19:1--19:??", month = oct, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2644807", ISSN = "1046-8188", bibdate = "Tue Oct 28 16:57:21 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This work explores how internal representations of modern statistical machine translation systems can be exploited for cross-language information retrieval. We tackle two core issues that are central to query translation: how to exploit context to generate more accurate translations and how to preserve ambiguity that may be present in the original query, thereby retaining a diverse set of translation alternatives. These two considerations are often in tension since ambiguity in natural language is typically resolved by exploiting context, but effective retrieval requires striking the right balance. We propose two novel query translation approaches: the grammar-based approach extracts translation probabilities from translation grammars, while the decoder-based approach takes advantage of n -best translation hypotheses. Both are context-sensitive, in contrast to a baseline context-insensitive approach that uses bilingual dictionaries for word-by-word translation. Experimental results show that by ``opening up'' modern statistical machine translation systems, we can access intermediate representations that yield high retrieval effectiveness. By combining evidence from multiple sources, we demonstrate significant improvements over competitive baselines on standard cross-language information retrieval test collections. In addition to effectiveness, the efficiency of our techniques are explored as well.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Raman:2014:UID, author = "Karthik Raman and Paul N. Bennett and Kevyn Collins-Thompson", title = "Understanding Intrinsic Diversity in {Web} Search: Improving Whole-Session Relevance", journal = j-TOIS, volume = "32", number = "4", pages = "20:1--20:??", month = oct, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2629553", ISSN = "1046-8188", bibdate = "Tue Oct 28 16:57:21 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Current research on Web search has focused on optimizing and evaluating single queries. However, a significant fraction of user queries are part of more complex tasks [Jones and Klinkner 2008] which span multiple queries across one or more search sessions [Liu and Belkin 2010; Kotov et al. 2011]. An ideal search engine would not only retrieve relevant results for a user's particular query but also be able to identify when the user is engaged in a more complex task and aid the user in completing that task [Morris et al. 2008; Agichtein et al. 2012]. Toward optimizing whole-session or task relevance, we characterize and address the problem of intrinsic diversity (ID) in retrieval [Radlinski et al. 2009], a type of complex task that requires multiple interactions with current search engines. Unlike existing work on extrinsic diversity [Carbonell and Goldstein 1998; Zhai et al. 2003; Chen and Karger 2006] that deals with ambiguity in intent across multiple users, ID queries often have little ambiguity in intent but seek content covering a variety of aspects on a shared theme. In such scenarios, the underlying needs are typically exploratory, comparative, or breadth-oriented in nature. We identify and address three key problems for ID retrieval: identifying authentic examples of ID tasks from post-hoc analysis of behavioral signals in search logs; learning to identify initiator queries that mark the start of an ID search task; and given an initiator query, predicting which content to prefetch and rank.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2014:CDS, author = "Jianguo Wang and Eric Lo and Man Lung Yiu and Jiancong Tong and Gang Wang and Xiaoguang Liu", title = "Cache Design of {SSD}-Based Search Engine Architectures: an Experimental Study", journal = j-TOIS, volume = "32", number = "4", pages = "21:1--21:??", month = oct, year = "2014", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2661629", ISSN = "1046-8188", bibdate = "Tue Oct 28 16:57:21 MDT 2014", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Caching is an important optimization in search engine architectures. Existing caching techniques for search engine optimization are mostly biased towards the reduction of random accesses to disks, because random accesses are known to be much more expensive than sequential accesses in traditional magnetic hard disk drive (HDD). Recently, solid-state drive (SSD) has emerged as a new kind of secondary storage medium, and some search engines like Baidu have already used SSD to completely replace HDD in their infrastructure. One notable property of SSD is that its random access latency is comparable to its sequential access latency. Therefore, the use of SSDs to replace HDDs in a search engine infrastructure may void the cache management of existing search engines. In this article, we carry out a series of empirical experiments to study the impact of SSD on search engine cache management. Based on the results, we give insights to practitioners and researchers on how to adapt the infrastructure and caching policies for SSD-based search engines.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bennett:2015:OSI, author = "Paul N. Bennett and Diane Kelly and Ryen W. White and Yi Zhang", title = "Overview of the Special Issue on Contextual Search and Recommendation", journal = j-TOIS, volume = "33", number = "1", pages = "1:1--1:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2691351", ISSN = "1046-8188", bibdate = "Tue Mar 17 18:01:38 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "1e", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cole:2015:UAP, author = "Michael J. Cole and Chathra Hendahewa and Nicholas J. Belkin and Chirag Shah", title = "User Activity Patterns During Information Search", journal = j-TOIS, volume = "33", number = "1", pages = "1:1--1:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699656", ISSN = "1046-8188", bibdate = "Tue Mar 17 18:01:38 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Personalization of support for information seeking depends crucially on the information retrieval system's knowledge of the task that led the person to engage in information seeking. Users work during information search sessions to satisfy their task goals, and their activity is not random. To what degree are there patterns in the user activity during information search sessions? Do activity patterns reflect the user's situation as the user moves through the search task under the influence of his or her task goal? Do these patterns reflect aspects of different types of information-seeking tasks? Could such activity patterns identify contexts within which information seeking takes place? To investigate these questions, we model sequences of user behaviors in two independent user studies of information search sessions (N = 32 users, 128 sessions, and N = 40 users, 160 sessions). Two representations of user activity patterns are used. One is based on the sequences of page use; the other is based on a cognitive representation of information acquisition derived from eye movement patterns in service of the reading process. One of the user studies considered journalism work tasks; the other concerned background research in genomics using search tasks taken from the TREC Genomics Track. The search tasks differed in basic dimensions of complexity, specificity, and the type of information product (intellectual or factual) needed to achieve the overall task goal. The results show that similar patterns of user activity are observed at both the cognitive and page use levels. The activity patterns at both representation layers are able to distinguish between task types in similar ways and, to some degree, between tasks of different levels of difficulty. We explore relationships between the results and task difficulty and discuss the use of activity patterns to explore events within a search session. User activity patterns can be at least partially observed in server-side search logs. A focus on patterns of user activity sequences may contribute to the development of information systems that better personalize the user's search experience.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yuan:2015:WWW, author = "Quan Yuan and Gao Cong and Kaiqi Zhao and Zongyang Ma and Aixin Sun", title = "Who, Where, When, and What: a Nonparametric {Bayesian} Approach to Context-aware Recommendation and Search for {Twitter} Users", journal = j-TOIS, volume = "33", number = "1", pages = "2:1--2:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699667", ISSN = "1046-8188", bibdate = "Tue Mar 17 18:01:38 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Micro-blogging services and location-based social networks, such as Twitter, Weibo, and Foursquare, enable users to post short messages with timestamps and geographical annotations. The rich spatial-temporal-semantic information of individuals embedded in these geo-annotated short messages provides exciting opportunity to develop many context-aware applications in ubiquitous computing environments. Example applications include contextual recommendation and contextual search. To obtain accurate recommendations and most relevant search results, it is important to capture users' contextual information (e.g., time and location) and to understand users' topical interests and intentions. While time and location can be readily captured by smartphones, understanding user's interests and intentions calls for effective methods in modeling user mobility behavior. Here, user mobility refers to who visits which place at what time for what activity. That is, user mobility behavior modeling must consider user (Who), spatial (Where), temporal (When), and activity (What) aspects. Unfortunately, no previous studies on user mobility behavior modeling have considered all of the four aspects jointly, which have complex interdependencies. In our preliminary study, we propose the first solution named W$^4$ (short for Who, Where, When, and What) to discover user mobility behavior from the four aspects. In this article, we further enhance W$^4$ and propose a nonparametric Bayesian model named EW$^4$ (short for Enhanced W$^4$ ). EW$^4$ requires no parameter tuning and achieves better results over W$^4$ in our experiments. Given some of the four aspects of a user (e.g., time), our model is able to infer information of the other aspects (e.g., location and topical words). Thus, our model has a variety of context-aware applications, particularly in contextual search and recommendation. Experimental results on two real-world datasets show that the proposed model is effective in discovering users' spatial-temporal topics. The model also significantly outperforms state-of-the-art baselines for various tasks including location prediction for tweets and requirement-aware location recommendation.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Jarvelin:2015:TBI, author = "Kalervo J{\"a}rvelin and Pertti Vakkari and Paavo Arvola and Feza Baskaya and Anni J{\"a}rvelin and Jaana Kek{\"a}l{\"a}inen and Heikki Keskustalo and Sanna Kumpulainen and Miamaria Saastamoinen and Reijo Savolainen and Eero Sormunen", title = "Task-Based Information Interaction Evaluation: The Viewpoint of Program Theory", journal = j-TOIS, volume = "33", number = "1", pages = "3:1--3:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699660", ISSN = "1046-8188", bibdate = "Tue Mar 17 18:01:38 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Evaluation is central in research and development of information retrieval (IR). In addition to designing and implementing new retrieval mechanisms, one must also show through rigorous evaluation that they are effective. A major focus in IR is IR mechanisms' capability of ranking relevant documents optimally for the users, given a query. Searching for information in practice involves searchers, however, and is highly interactive. When human searchers have been incorporated in evaluation studies, the results have often suggested that better ranking does not necessarily lead to better search task, or work task, performance. Therefore, it is not clear which system or interface features should be developed to improve the effectiveness of human task performance. In the present article, we focus on the evaluation of task-based information interaction (TBII). We give special emphasis to learning tasks to discuss TBII in more concrete terms. Information interaction is here understood as behavioral and cognitive activities related to task planning, searching information items, selecting between them, working with them, and synthesizing and reporting. These five generic activities contribute to task performance and outcome and can be supported by information systems. In an attempt toward task-based evaluation, we introduce program theory as the evaluation framework. Such evaluation can investigate whether a program consisting of TBII activities and tools works and how it works and, further, provides a causal description of program (in)effectiveness. Our goal in the present article is to structure TBII on the basis of the five generic activities and consider the evaluation of each activity using the program theory framework. Finally, we combine these activity-based program theories in an overall evaluation framework for TBII. Such an evaluation is complex due to the large number of factors affecting information interaction. Instead of presenting tested program theories, we illustrate how the evaluation of TBII should be accomplished using the program theory framework in the evaluation of systems and behaviors, and their interactions, comprehensively in context.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Alhindi:2015:PBS, author = "Azhar Alhindi and Udo Kruschwitz and Chris Fox and M-Dyaa Albakour", title = "Profile-Based Summarisation for {Web} Site Navigation", journal = j-TOIS, volume = "33", number = "1", pages = "4:1--4:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699661", ISSN = "1046-8188", bibdate = "Tue Mar 17 18:01:38 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information systems that utilise contextual information have the potential of helping a user identify relevant information more quickly and more accurately than systems that work the same for all users and contexts. Contextual information comes in a variety of types, often derived from records of past interactions between a user and the information system. It can be individual or group based. We are focusing on the latter, harnessing the search behaviour of cohorts of users, turning it into a domain model that can then be used to assist other users of the same cohort. More specifically, we aim to explore how such a domain model is best utilised for profile-biased summarisation of documents in a navigation scenario in which such summaries can be displayed as hover text as a user moves the mouse over a link. The main motivation is to help a user find relevant documents more quickly. Given the fact that the Web in general has been studied extensively already, we focus our attention on Web sites and similar document collections. Such collections can be notoriously difficult to search or explore. The process of acquiring the domain model is not a research interest here; we simply adopt a biologically inspired method that resembles the idea of ant colony optimisation. This has been shown to work well in a variety of application areas. The model can be built in a continuous learning cycle that exploits search patterns as recorded in typical query log files. Our research explores different summarisation techniques, some of which use the domain model and some that do not. We perform task-based evaluations of these different techniques-thus of the impact of the domain model and profile-biased summarisation-in the context of Web site navigation.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chuklin:2015:CAI, author = "Aleksandr Chuklin and Anne Schuth and Ke Zhou and Maarten {De Rijke}", title = "A Comparative Analysis of Interleaving Methods for Aggregated Search", journal = j-TOIS, volume = "33", number = "2", pages = "5:1--5:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2668120", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:29 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A result page of a modern search engine often goes beyond a simple list of ``10 blue links.'' Many specific user needs (e.g., News, Image, Video) are addressed by so-called aggregated or vertical search solutions: specially presented documents, often retrieved from specific sources, that stand out from the regular organic Web search results. When it comes to evaluating ranking systems, such complex result layouts raise their own challenges. This is especially true for so-called interleaving methods that have arisen as an important type of online evaluation: by mixing results from two different result pages, interleaving can easily break the desired Web layout in which vertical documents are grouped together, and hence hurt the user experience. We conduct an analysis of different interleaving methods as applied to aggregated search engine result pages. Apart from conventional interleaving methods, we propose two vertical-aware methods: one derived from the widely used Team-Draft Interleaving method by adjusting it in such a way that it respects vertical document groupings, and another based on the recently introduced Optimized Interleaving framework. We show that our proposed methods are better at preserving the user experience than existing interleaving methods while still performing well as a tool for comparing ranking systems. For evaluating our proposed vertical-aware interleaving methods, we use real-world click data as well as simulated clicks and simulated ranking systems.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bing:2015:WQR, author = "Lidong Bing and Wai Lam and Tak-Lam Wong and Shoaib Jameel", title = "{Web} Query Reformulation via Joint Modeling of Latent Topic Dependency and Term Context", journal = j-TOIS, volume = "33", number = "2", pages = "6:1--6:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699666", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:29 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "An important way to improve users' satisfaction in Web search is to assist them by issuing more effective queries. One such approach is query reformulation, which generates new queries according to the current query issued by users. A common procedure for conducting reformulation is to generate some candidate queries first, then a scoring method is employed to assess these candidates. Currently, most of the existing methods are context based. They rely heavily on the context relation of terms in the history queries and cannot detect and maintain the semantic consistency of queries. In this article, we propose a graphical model to score queries. The proposed model exploits a latent topic space, which is automatically derived from the query log, to detect semantic dependency of terms in a query and dependency among topics. Meanwhile, the graphical model also captures the term context in the history query by skip-bigram and n-gram language models. In addition, our model can be easily extended to consider users' history search interests when we conduct query reformulation for different users. In the task of candidate query generation, we investigate a social tagging data resource-Delicious bookmark-to generate addition and substitution patterns that are employed as supplements to the patterns generated from query log data.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tian:2015:TTA, author = "Yonghong Tian and Mengren Qian and Tiejun Huang", title = "{TASC}: a Transformation-Aware Soft Cascading Approach for Multimodal Video Copy Detection", journal = j-TOIS, volume = "33", number = "2", pages = "7:1--7:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699662", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:29 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "How to precisely and efficiently detect near-duplicate copies with complicated audiovisual transformations from a large-scale video database is a challenging task. To cope with this challenge, this article proposes a transformation-aware soft cascading (TASC) approach for multimodal video copy detection. Basically, our approach divides query videos into some categories and then for each category designs a transformation-aware chain to organize several detectors in a cascade structure. In each chain, efficient but simple detectors are placed in the forepart, whereas effective but complex detectors are located in the rear. To judge whether two videos are near-duplicates, a Detection-on-Copy-Units mechanism is introduced in the TASC, which makes the decision of copy detection depending on the similarity between their most similar fractions, called copy units (CUs), rather than the video-level similarity. Following this, we propose a CU search algorithm to find a pair of CUs from two videos and a CU-based localization algorithm to find the precise locations of their copy segments that are with the asserted CUs as the center. Moreover, to address the problem that the copies and noncopies are possibly linearly inseparable in the feature space, the TASC also introduces a flexible strategy, called soft decision boundary, to replace the single threshold strategy for each detector. Its basic idea is to automatically learn two thresholds for each detector to examine the easy-to-judge copies and noncopies, respectively, and meanwhile to train a nonlinear classifier to further check those hard-to-judge ones. Extensive experiments on three benchmark datasets showed that the TASC can achieve excellent copy detection accuracy and localization precision with a very high processing efficiency.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Na:2015:TSD, author = "Seung-Hoon Na", title = "Two-Stage Document Length Normalization for Information Retrieval", journal = j-TOIS, volume = "33", number = "2", pages = "8:1--8:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699669", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:29 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The standard approach for term frequency normalization is based only on the document length. However, it does not distinguish the verbosity from the scope, these being the two main factors determining the document length. Because the verbosity and scope have largely different effects on the increase in term frequency, the standard approach can easily suffer from insufficient or excessive penalization depending on the specific type of long document. To overcome these problems, this article proposes two-stage normalization by performing verbosity and scope normalization separately, and by employing different penalization functions. In verbosity normalization, each document is prenormalized by dividing the term frequency by the verbosity of the document. In scope normalization, an existing retrieval model is applied in a straightforward manner to the prenormalized document, finally leading us to formulate our proposed verbosity normalized (VN) retrieval model. Experimental results carried out on standard TREC collections demonstrate that the VN model leads to marginal but statistically significant improvements over standard retrieval models.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ah-Pine:2015:UVT, author = "Julien Ah-Pine and Gabriela Csurka and St{\'e}phane Clinchant", title = "Unsupervised Visual and Textual Information Fusion in {CBMIR} Using Graph-Based Methods", journal = j-TOIS, volume = "33", number = "2", pages = "9:1--9:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699668", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:29 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Multimedia collections are more than ever growing in size and diversity. Effective multimedia retrieval systems are thus critical to access these datasets from the end-user perspective and in a scalable way. We are interested in repositories of image/text multimedia objects and we study multimodal information fusion techniques in the context of content-based multimedia information retrieval. We focus on graph-based methods, which have proven to provide state-of-the-art performances. We particularly examine two such methods: cross-media similarities and random-walk-based scores. From a theoretical viewpoint, we propose a unifying graph-based framework, which encompasses the two aforementioned approaches. Our proposal allows us to highlight the core features one should consider when using a graph-based technique for the combination of visual and textual information. We compare cross-media and random-walk-based results using three different real-world datasets. From a practical standpoint, our extended empirical analyses allow us to provide insights and guidelines about the use of graph-based methods for multimodal information fusion in content-based multimedia information retrieval.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Anagnostopoulos:2015:SQC, author = "Aris Anagnostopoulos and Luca Becchetti and Ilaria Bordino and Stefano Leonardi and Ida Mele and Piotr Sankowski", title = "Stochastic Query Covering for Fast Approximate Document Retrieval", journal = j-TOIS, volume = "33", number = "3", pages = "11:1--11:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699671", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:30 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We design algorithms that, given a collection of documents and a distribution over user queries, return a small subset of the document collection in such a way that we can efficiently provide high-quality answers to user queries using only the selected subset. This approach has applications when space is a constraint or when the query-processing time increases significantly with the size of the collection. We study our algorithms through the lens of stochastic analysis and prove that even though they use only a small fraction of the entire collection, they can provide answers to most user queries, achieving a performance close to the optimal. To complement our theoretical findings, we experimentally show the versatility of our approach by considering two important cases in the context of Web search. In the first case, we favor the retrieval of documents that are relevant to the query, whereas in the second case we aim for document diversification. Both the theoretical and the experimental analysis provide strong evidence of the potential value of query covering in diverse application scenarios.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nong:2015:ISS, author = "Ge Nong and Wai Hong Chan and Sheng Qing Hu and Yi Wu", title = "Induced Sorting Suffixes in External Memory", journal = j-TOIS, volume = "33", number = "3", pages = "12:1--12:??", month = feb, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2699665", ISSN = "1046-8188", bibdate = "Fri Mar 6 09:56:30 MST 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present in this article an external memory algorithm, called disk SA-IS (DSA-IS), to exactly emulate the induced sorting algorithm SA-IS previously proposed for sorting suffixes in RAM. DSA-IS is a new disk-friendly method for sequentially retrieving the preceding character of a sorted suffix to induce the order of the preceding suffix. For a size $n$ string of a constant or integer alphabet, given the RAM capacity $ \Omega ((n W)^{0.5}) $, where $W$ is the size of each I/O buffer that is large enough to amortize the overhead of each access to disk, both the CPU time and peak disk use of DSA-IS are $ O(n)$. Our experimental study shows that on average, DSA-IS achieves the best time and space results of all of the existing external memory algorithms based on the induced sorting principle.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yang:2015:BHC, author = "Hui Yang", title = "Browsing Hierarchy Construction by Minimum Evolution", journal = j-TOIS, volume = "33", number = "3", pages = "13:1--13:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2714574", ISSN = "1046-8188", bibdate = "Mon Mar 23 17:09:13 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Hierarchies serve as browsing tools to access information in document collections. This article explores techniques to derive browsing hierarchies that can be used as an information map for task-based search. It proposes a novel minimum-evolution hierarchy construction framework that directly learns semantic distances from training data and from users to construct hierarchies. The aim is to produce globally optimized hierarchical structures by incorporating user-generated task specifications into the general learning framework. Both an automatic version of the framework and an interactive version are presented. A comparison with state-of-the-art systems and a user study jointly demonstrate that the proposed framework is highly effective.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pal:2015:MAR, author = "Aditya Pal", title = "Metrics and Algorithms for Routing Questions to User Communities", journal = j-TOIS, volume = "33", number = "3", pages = "14:1--14:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2724706", ISSN = "1046-8188", bibdate = "Mon Mar 23 17:09:13 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "An online community consists of a group of users who share a common interest, background, or experience, and their collective goal is to contribute toward the welfare of the community members. Several websites allow their users to create and manage niche communities, such as Yahoo! Groups, Facebook Groups, Google+ Circles, and WebMD Forums. These community services also exist within enterprises, such as IBM Connections. Question answering within these communities enables their members to exchange knowledge and information with other community members. However, the onus of finding the right community for question asking lies with an individual user. The overwhelming number of communities necessitates the need for a good question routing strategy so that new questions get routed to an appropriately focused community and thus get resolved in a reasonable time frame. In this article, we consider the novel problem of routing a question to the right community and propose a framework for selecting and ranking the relevant communities for a question. We propose several novel features for modeling the three main entities of the system: questions, users, and communities. We propose features such as language attributes, inclination to respond, user familiarity, and difficulty of a question; based on these features, we propose similarity metrics between the routed question and the system entities. We introduce a Cutoff-Aggregation ( CA ) algorithm that aggregates the entity similarity within a community to compute that community's relevance. We introduce two k -nearest-neighbor ( knn ) algorithms that are a natural instantiation of the CA algorithm, which are computationally efficient and evaluate several ranking algorithms over the aggregate similarity scores computed by the two knn algorithms. We propose clustering techniques to speed up our recommendation framework and show how pipelining can improve the model performance. We demonstrate the effectiveness of our framework on two large real-world datasets.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhao:2015:GSB, author = "Wayne Xin Zhao and Xudong Zhang and Daniel Lemire and Dongdong Shan and Jian-Yun Nie and Hongfei Yan and Ji-Rong Wen", title = "A General {SIMD}-Based Approach to Accelerating Compression Algorithms", journal = j-TOIS, volume = "33", number = "3", pages = "15:1--15:??", month = mar, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2735629", ISSN = "1046-8188", bibdate = "Mon Mar 23 17:09:13 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/datacompression.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Compression algorithms are important for data-oriented tasks, especially in the era of ``Big Data.'' Modern processors equipped with powerful SIMD instruction sets provide us with an opportunity for achieving better compression performance. Previous research has shown that SIMD-based optimizations can multiply decoding speeds. Following these pioneering studies, we propose a general approach to accelerate compression algorithms. By instantiating the approach, we have developed several novel integer compression algorithms, called Group-Simple, Group-Scheme, Group-AFOR, and Group-PFD, and implemented their corresponding vectorized versions. We evaluate the proposed algorithms on two public TREC datasets, a Wikipedia dataset, and a Twitter dataset. With competitive compression ratios and encoding speeds, our SIMD-based algorithms outperform state-of-the-art nonvectorized algorithms with respect to decoding speeds.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Han:2015:USC, author = "Shuguang Han and Zhen Yue and Daqing He", title = "Understanding and Supporting Cross-Device {Web} Search for Exploratory Tasks with Mobile Touch Interactions", journal = j-TOIS, volume = "33", number = "4", pages = "16:1--16:??", month = may, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2738036", ISSN = "1046-8188", bibdate = "Fri Aug 7 08:59:27 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Mobile devices enable people to look for information at the moment when their information needs are triggered. While experiencing complex information needs that require multiple search sessions, users may utilize desktop computers to fulfill information needs started on mobile devices. Under the context of mobile-to-desktop web search, this article analyzes users' behavioral patterns and compares them to the patterns in desktop-to-desktop web search. Then, we examine several approaches of using Mobile Touch Interactions (MTIs) to infer relevant content so that such content can be used for supporting subsequent search queries on desktop computers. The experimental data used in this article was collected through a user study involving 24 participants and six properly designed cross-device web search tasks. Our experimental results show that (1) users' mobile-to-desktop search behaviors do significantly differ from desktop-to-desktop search behaviors in terms of information exploration, sense-making and repeated behaviors. (2) MTIs can be employed to predict the relevance of click-through documents, but applying document-level relevant content based on the predicted relevance does not improve search performance. (3) MTIs can also be used to identify the relevant text chunks at a fine-grained subdocument level. Such relevant information can achieve better search performance than the document-level relevant content. In addition, such subdocument relevant information can be combined with document-level relevance to further improve the search performance. However, the effectiveness of these methods relies on the sufficiency of click-through documents. (4) MTIs can also be obtained from the Search Engine Results Pages (SERPs). The subdocument feedbacks inferred from this set of MTIs even outperform the MTI-based subdocument feedback from the click-through documents.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Kulkarni:2015:SSE, author = "Anagha Kulkarni and Jamie Callan", title = "Selective Search: Efficient and Effective Search of Large Textual Collections", journal = j-TOIS, volume = "33", number = "4", pages = "17:1--17:??", month = may, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2738035", ISSN = "1046-8188", bibdate = "Fri Aug 7 08:59:27 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The traditional search solution for large collections divides the collection into subsets ( shards ), and processes the query against all shards in parallel ( exhaustive search ). The search cost and the computational requirements of this approach are often prohibitively high for organizations with few computational resources. This article investigates and extends an alternative: selective search, an approach that partitions the dataset based on document similarity to obtain topic-based shards, and searches only a few shards that are estimated to contain relevant documents for the query. We propose shard creation techniques that are scalable, efficient, self-reliant, and create topic-based shards with low variance in size, and high density of relevant documents. The experimental results demonstrate that the effectiveness of selective search is on par with that of exhaustive search, and the corresponding search costs are substantially lower with the former. Also, the majority of the queries perform as well or better with selective search. An oracle experiment that uses optimal shard ranking for a query indicates that selective search can outperform the effectiveness of exhaustive search. Comparison with a query optimization technique shows higher improvements in efficiency with selective search. The overall best efficiency is achieved when the two techniques are combined in an optimized selective search approach.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{White:2015:BDB, author = "Ryen W. White and Eric Horvitz", title = "Belief Dynamics and Biases in {Web} Search", journal = j-TOIS, volume = "33", number = "4", pages = "18:1--18:??", month = may, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2746229", ISSN = "1046-8188", bibdate = "Fri Aug 7 08:59:27 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We investigate how beliefs about the efficacy of medical interventions are influenced by searchers' exposure to information on retrieved Web pages. We present a methodology for measuring participants' beliefs and confidence about the efficacy of treatment before, during, and after search episodes. We consider interventions studied in the Cochrane collection of meta-analyses. We extract related queries from search engine logs and consider the Cochrane assessments as ground truth. We analyze the dynamics of belief over time and show the influence of prior beliefs and confidence at the end of sessions. We present evidence for confirmation bias and for anchoring-and-adjustment during search and retrieval. Then, we build predictive models to estimate postsearch beliefs using sets of features about behavior and content. The findings provide insights about the influence of Web content on the beliefs of people and have implications for the design of search systems.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Dang:2015:FFI, author = "Edward Kai Fung Dang and Robert Wing Pong Luk and James Allan", title = "Fast Forward Index Methods for Pseudo-Relevance Feedback Retrieval", journal = j-TOIS, volume = "33", number = "4", pages = "19:1--19:??", month = may, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2744199", ISSN = "1046-8188", bibdate = "Fri Aug 7 08:59:27 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The inverted index is the dominant indexing method in information retrieval systems. It enables fast return of the list of all documents containing a given query term. However, for retrieval schemes involving query expansion, as in pseudo-relevance feedback (PRF), the retrieval time based on an inverted index increases linearly with the number of expansion terms. In this regard, we have examined the use of a forward index, which consists of the mapping of each document to its constituent terms. We propose a novel forward index-based reranking scheme to shorten the PRF retrieval time. In our method, a first retrieval of the original query is performed using an inverted index, and then a forward index is employed for the PRF part. We have studied several new forward indexes, including using a novel spstring data structure and the weighted variable bit-block compression (wvbc) signature. With modern hardware such as solid-state drives (SSDs) and sufficiently large main memory, forward index methods are particularly promising. We find that with the whole index stored in main memory, PRF retrieval using a spstring or wvbc forward index excels in time efficiency over an inverted index, being able to obtain the same levels of performance measures at shorter times.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yang:2015:QCM, author = "Hui Yang and Dongyi Guan and Sicong Zhang", title = "The Query Change Model: Modeling Session Search as a {Markov} Decision Process", journal = j-TOIS, volume = "33", number = "4", pages = "20:1--20:??", month = may, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2747874", ISSN = "1046-8188", bibdate = "Fri Aug 7 08:59:27 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Modern information retrieval (IR) systems exhibit user dynamics through interactivity. These dynamic aspects of IR, including changes found in data, users, and systems, are increasingly being utilized in search engines. Session search is one such IR task-document retrieval within a session. During a session, a user constantly modifies queries to find documents that fulfill an information need. Existing IR techniques for assisting the user in this task are limited in their ability to optimize over changes, learn with a minimal computational footprint, and be responsive. This article proposes a novel query change retrieval model (QCM), which uses syntactic editing changes between consecutive queries, as well as the relationship between query changes and previously retrieved documents, to enhance session search. We propose modeling session search as a Markov decision process (MDP). We consider two agents in this MDP: the user agent and the search engine agent. The user agent's actions are query changes that we observe, and the search engine agent's actions are term weight adjustments as proposed in this work. We also investigate multiple query aggregation schemes and their effectiveness on session search. Experiments show that our approach is highly effective and outperforms top session search systems in TREC 2011 and TREC 2012.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cummins:2015:PUD, author = "Ronan Cummins and Jiaul H. Paik and Yuanhua Lv", title = "A {P{\'o}lya} Urn Document Language Model for Improved Information Retrieval", journal = j-TOIS, volume = "33", number = "4", pages = "21:1--21:??", month = may, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2746231", ISSN = "1046-8188", bibdate = "Fri Aug 7 08:59:27 MDT 2015", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The multinomial language model has been one of the most effective models of retrieval for more than a decade. However, the multinomial distribution does not model one important linguistic phenomenon relating to term dependency-that is, the tendency of a term to repeat itself within a document (i.e., word burstiness). In this article, we model document generation as a random process with reinforcement (a multivariate P{\'o}lya process) and develop a Dirichlet compound multinomial language model that captures word burstiness directly. We show that the new reinforced language model can be computed as efficiently as current retrieval models, and with experiments on an extensive set of TREC collections, we show that it significantly outperforms the state-of-the-art language model for a number of standard effectiveness metrics. Experiments also show that the tuning parameter in the proposed model is more robust than that in the multinomial language model. Furthermore, we develop a constraint for the verbosity hypothesis and show that the proposed model adheres to the constraint. Finally, we show that the new language model essentially introduces a measure closely related to idf, which gives theoretical justification for combining the term and document event spaces in tf-idf type schemes.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Mayer:2015:IOV, author = "Julia M. Mayer and Quentin Jones and Starr Roxanne Hiltz", title = "Identifying Opportunities for Valuable Encounters: Toward Context-Aware Social Matching Systems", journal = j-TOIS, volume = "34", number = "1", pages = "1:1--1:??", month = oct, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2751557", ISSN = "1046-8188", bibdate = "Tue Feb 16 15:32:55 MST 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Mobile social matching systems have the potential to transform the way we make new social ties, but only if we are able to overcome the many challenges that exist as to how systems can utilize contextual data to recommend interesting and relevant people to users and facilitate valuable encounters between strangers. This article outlines how context and mobility influence people's motivations to meet new people and presents innovative design concepts for mediating mobile encounters through context-aware social matching systems. Findings from two studies are presented. The first, a survey study (n {\SGMLequals} 117) explored the concept of contextual rarity of shared user attributes as a measure to improve desirability in mobile social matches. The second, an interview study (n {\SGMLequals} 58) explored people's motivations to meet others in various contexts. From these studies we derived a set of novel context-aware social matching concepts, including contextual sociability and familiarity as an indicator of opportune social context; contextual engagement as an indicator of opportune personal context; and contextual rarity, oddity, and activity partnering as an indicator of opportune relational context. The findings of these studies establish the importance of different contextual factors and frame the design space of context-aware social matching systems.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Quan:2015:LDM, author = "Xiaojun Quan and Qifan Wang and Ying Zhang and Luo Si and Liu Wenyin", title = "Latent Discriminative Models for Social Emotion Detection with Emotional Dependency", journal = j-TOIS, volume = "34", number = "1", pages = "2:1--2:??", month = oct, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2749459", ISSN = "1046-8188", bibdate = "Tue Feb 16 15:32:55 MST 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Sentiment analysis of such opinionated online texts as reviews and comments has received increasingly close attention, yet most of the work is intended to deal with the detection of authors' emotion. In contrast, this article presents our study of the social emotion detection problem, the objective of which is to identify the evoked emotions of readers by online documents such as news articles. A novel Latent Discriminative Model (LDM) is proposed for this task. LDM works by introducing intermediate hidden variables to model the latent structure of input text corpora. To achieve this, it defines a joint distribution over emotions and latent variables, conditioned on the observed text documents. Moreover, we assume that social emotions are not independent but correlated with one another, and the dependency of them is capable of providing additional guidance to LDM in the training process. The inclusion of this emotional dependency into LDM gives rise to a new Emotional Dependency-based LDM (eLDM). We evaluate the proposed models through a series of empirical evaluations on two real-world corpora of news articles. Experimental results verify the effectiveness of LDM and eLDM in social emotion detection.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yan:2015:DDS, author = "Su Yan and Xiaojun Wan", title = "Deep Dependency Substructure-Based Learning for Multidocument Summarization", journal = j-TOIS, volume = "34", number = "1", pages = "3:1--3:??", month = oct, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2766447", ISSN = "1046-8188", bibdate = "Tue Feb 16 15:32:55 MST 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Most extractive style topic-focused multidocument summarization systems generate a summary by ranking textual units in multiple documents and extracting a proper subset of sentences biased to the given topic. Usually, the textual units are simply represented as sentences or n-grams, which do not carry deep syntactic and semantic information. This article presents a novel extractive topic-focused multidocument summarization framework. The framework proposes a new kind of more meaningful and informative units named frequent Deep Dependency Sub-Structure (DDSS) and a topic-sensitive Multi-Task Learning (MTL) model for frequent DDSS ranking. Given a document set, first, we parse all the sentences into deep dependency structures with a Head-driven Phrase Structure Grammar (HPSG) parser and mine the frequent DDSSs after semantic normalization. Then we employ a topic-sensitive MTL model to learn the importance of these frequent DDSSs. Finally, we exploit an Integer Linear Programming (ILP) formulation and use the frequent DDSSs as the essentials for summary extraction. Experimental results on two DUC datasets demonstrate that our proposed approach can achieve state-of-the-art performance. Both the DDSS information and the topic-sensitive MTL model are validated to be very helpful for topic-focused multidocument summarization.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cui:2015:KGF, author = "Qing Cui and Bin Gao and Jiang Bian and Siyu Qiu and Hanjun Dai and Tie-Yan Liu", title = "{KNET}: a General Framework for Learning Word Embedding Using Morphological Knowledge", journal = j-TOIS, volume = "34", number = "1", pages = "4:1--4:??", month = oct, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2797137", ISSN = "1046-8188", bibdate = "Tue Feb 16 15:32:55 MST 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Neural network techniques are widely applied to obtain high-quality distributed representations of words (i.e., word embeddings) to address text mining, information retrieval, and natural language processing tasks. Most recent efforts have proposed several efficient methods to learn word embeddings from context such that they can encode both semantic and syntactic relationships between words. However, it is quite challenging to handle unseen or rare words with insufficient context. Inspired by the study on the word recognition process in cognitive psychology, in this article, we propose to take advantage of seemingly less obvious but essentially important morphological knowledge to address these challenges. In particular, we introduce a novel neural network architecture called KNET that leverages both words' contextual information and morphological knowledge to learn word embeddings. Meanwhile, this new learning architecture is also able to benefit from noisy knowledge and balance between contextual information and morphological knowledge. Experiments on an analogical reasoning task and a word similarity task both demonstrate that the proposed KNET framework can greatly enhance the effectiveness of word embeddings.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Baralis:2015:MSM, author = "Elena Baralis and Luca Cagliero and Alessandro Fiori and Paolo Garza", title = "{MWI-Sum}: a Multilingual Summarizer Based on Frequent Weighted Itemsets", journal = j-TOIS, volume = "34", number = "1", pages = "5:1--5:??", month = oct, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2809786", ISSN = "1046-8188", bibdate = "Tue Feb 16 15:32:55 MST 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Multidocument summarization addresses the selection of a compact subset of highly informative sentences, i.e., the summary, from a collection of textual documents. To perform sentence selection, two parallel strategies have been proposed: (a) apply general-purpose techniques relying on data mining or information retrieval techniques, and/or (b) perform advanced linguistic analysis relying on semantics-based models (e.g., ontologies) to capture the actual sentence meaning. Since there is an increasing need for processing documents written in different languages, the attention of the research community has recently focused on summarizers based on strategy (a). This article presents a novel multilingual summarizer, namely MWI-Sum (Multilingual Weighted Itemset-based Summarizer), that exploits an itemset-based model to summarize collections of documents ranging over the same topic. Unlike previous approaches, it extracts frequent weighted itemsets tailored to the analyzed collection and uses them to drive the sentence selection process. Weighted itemsets represent correlations among multiple highly relevant terms that are neglected by previous approaches. The proposed approach makes minimal use of language-dependent analyses. Thus, it is easily applicable to document collections written in different languages. Experiments performed on benchmark and real-life collections, English-written and not, demonstrate that the proposed approach performs better than state-of-the-art multilingual document summarizers.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Costa:2015:DRM, author = "Alberto Costa and Emanuele {Di Buccio} and Massimo Melucci", title = "A Document Retrieval Model Based on Digital Signal Filtering", journal = j-TOIS, volume = "34", number = "1", pages = "6:1--6:??", month = oct, year = "2015", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2809787", ISSN = "1046-8188", bibdate = "Tue Feb 16 15:32:55 MST 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information retrieval (IR) systems are designed, in general, to satisfy the information need of a user who expresses it by means of a query, by providing him with a subset of documents selected from a collection and ordered by decreasing relevance to the query. Such systems are based on IR models, which define how to represent the documents and the query, as well as how to determine the relevance of a document for a query. In this article, we present a new IR model based on concepts taken from both IR and digital signal processing (like Fourier analysis of signals and filtering). This allows the whole IR process to be seen as a physical phenomenon, where the query corresponds to a signal, the documents correspond to filters, and the determination of the relevant documents to the query is done by filtering that signal. Tests showed that the quality of the results provided by this IR model is comparable with the state-of-the-art.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tang:2016:TLI, author = "Jie Tang and Tiancheng Lou and Jon Kleinberg and Sen Wu", title = "Transfer Learning to Infer Social Ties across Heterogeneous Networks", journal = j-TOIS, volume = "34", number = "2", pages = "7:1--7:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2746230", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Interpersonal ties are responsible for the structure of social networks and the transmission of information through these networks. Different types of social ties have essentially different influences on people. Awareness of the types of social ties can benefit many applications, such as recommendation and community detection. For example, our close friends tend to move in the same circles that we do, while our classmates may be distributed into different communities. Though a bulk of research has focused on inferring particular types of relationships in a specific social network, few publications systematically study the generalization of the problem of predicting social ties across multiple heterogeneous networks. In this work, we develop a framework referred to as TranFG for classifying the type of social relationships by learning across heterogeneous networks. The framework incorporates social theories into a factor graph model, which effectively improves the accuracy of predicting the types of social relationships in a target network by borrowing knowledge from a different source network. We also present several active learning strategies to further enhance the inferring performance. To scale up the model to handle really large networks, we design a distributed learning algorithm for the proposed model. We evaluate the proposed framework (TranFG) on six different networks and compare with several existing methods. TranFG clearly outperforms the existing methods on multiple metrics. For example, by leveraging information from a coauthor network with labeled advisor-advisee relationships, TranFG is able to obtain an F1-score of 90\% (8\%--28\% improvements over alternative methods) for predicting manager-subordinate relationships in an enterprise email network. The proposed model is efficient. It takes only a few minutes to train the proposed transfer model on large networks containing tens of thousands of nodes.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Petersen:2016:PLD, author = "Casper Petersen and Jakob Grue Simonsen and Christina Lioma", title = "Power Law Distributions in Information Retrieval", journal = j-TOIS, volume = "34", number = "2", pages = "8:1--8:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2816815", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Several properties of information retrieval (IR) data, such as query frequency or document length, are widely considered to be approximately distributed as a power law. This common assumption aims to focus on specific characteristics of the empirical probability distribution of such data (e.g., its scale-free nature or its long/fat tail). This assumption, however, may not be always true. Motivated by recent work in the statistical treatment of power law claims, we investigate two research questions: (i) To what extent do power law approximations hold for term frequency, document length, query frequency, query length, citation frequency, and syntactic unigram frequency? And (ii) what is the computational cost of replacing ad hoc power law approximations with more accurate distribution fitting? We study 23 TREC and 5 non-TREC datasets and compare the fit of power laws to 15 other standard probability distributions. We find that query frequency and 5 out of 24 term frequency distributions are best approximated by a power law. All remaining properties are better approximated by the Inverse Gaussian, Generalized Extreme Value, Negative Binomial, or Yule distribution. We also find the overhead of replacing power law approximations by more informed distribution fitting to be negligible, with potential gains to IR tasks like index compression or test collection generation for IR evaluation.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Gomez-Rodriguez:2016:IEM, author = "Manuel Gomez-Rodriguez and Le Song and Nan Du and Hongyuan Zha and Bernhard Sch{\"o}lkopf", title = "Influence Estimation and Maximization in Continuous-Time Diffusion Networks", journal = j-TOIS, volume = "34", number = "2", pages = "9:1--9:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2824253", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "If a piece of information is released from a set of media sites, can it spread, in 1 month, to a million web pages? Can we efficiently find a small set of media sites among millions that can maximize the spread of the information, in 1 month? The two problems are called influence estimation and maximization problems respectively, which are very challenging since both the time-sensitive nature of the problems and the issue of scalability need to be addressed simultaneously. In this article, we propose two algorithms for influence estimation in continuous-time diffusion networks. The first one uses continuous-time Markov chains to estimate influence exactly on networks with exponential, or, more generally, phase-type transmission functions, but does not scale to large-scale networks, and the second one is a highly efficient randomized algorithm, which estimates the influence of every node in a network with general transmission functions, $| \nu |$ nodes and $| \epsilon |$ edges to an accuracy of $\epsilon$ using $n = O(1 / \epsilon^2)$ randomizations and up to logarithmic factors $O( n | \epsilon |+ n | \nu |)$ computations. We then show that finding the set of most influential source nodes in a continuous time diffusion network is an NP-hard problem and develop an efficient greedy algorithm with provable near-optimal performance. When used as subroutines in the influence maximization algorithm, the exact influence estimation algorithm is guaranteed to find a set of $C$ nodes with an influence of at least $(1 - 1 / e ) {\rm OPT}$ and the randomized algorithm is guaranteed to find a set with an influence of at least $(1 - 1 / e ){\rm OPT} - 2 C \epsilon$, where ${\rm OPT}$ is the optimal value. Experiments on both synthetic and real-world data show that the proposed algorithms significantly improve over previous state-of-the-art methods in terms of the accuracy of the estimated influence and the quality of the selected nodes to maximize the influence, and the randomized algorithm can easily scale up to networks of millions of nodes.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Song:2016:VTP, author = "Xuemeng Song and Zhao-Yan Ming and Liqiang Nie and Yi-Liang Zhao and Tat-Seng Chua", title = "Volunteerism Tendency Prediction via Harvesting Multiple Social Networks", journal = j-TOIS, volume = "34", number = "2", pages = "10:1--10:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2832907", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Volunteers have always been extremely crucial and in urgent need for nonprofit organizations (NPOs) to sustain their continuing operations. However, it is expensive and time-consuming to recruit volunteers using traditional approaches. In the Web 2.0 era, abundant and ubiquitous social media data opens a door to the possibility of automatic volunteer identification. In this article, we aim to fully explore this possibility by proposing a scheme that is able to predict users' volunteerism tendency from user-generated contents collected from multiple social networks based on a conceptual volunteering decision model. We conducted comprehensive experiments to investigate the effectiveness of our proposed scheme and further discussed its generalizibility and extendability. This novel interdisciplinary research will potentially inspire more promising and important human-centered applications.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Li:2016:TBI, author = "Qing Li and Yuanzhu Chen and Li Ling Jiang and Ping Li and Hsinchun Chen", title = "A Tensor-Based Information Framework for Predicting the Stock Market", journal = j-TOIS, volume = "34", number = "2", pages = "11:1--11:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2838731", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "To study the influence of information on the behavior of stock markets, a common strategy in previous studies has been to concatenate the features of various information sources into one compound feature vector, a procedure that makes it more difficult to distinguish the effects of different information sources. We maintain that capturing the intrinsic relations among multiple information sources is important for predicting stock trends. The challenge lies in modeling the complex space of various sources and types of information and studying the effects of this information on stock market behavior. For this purpose, we introduce a tensor-based information framework to predict stock movements. Specifically, our framework models the complex investor information environment with tensors. A global dimensionality-reduction algorithm is used to capture the links among various information sources in a tensor, and a sequence of tensors is used to represent information gathered over time. Finally, a tensor-based predictive model to forecast stock movements, which is in essence a high-order tensor regression learning problem, is presented. Experiments performed on an entire year of data for China Securities Index stocks demonstrate that a trading system based on our framework outperforms the classic Top- N trading strategy and two state-of-the-art media-aware trading algorithms.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Piao:2016:SFA, author = "Minghao Piao and Keun Ho Ryu", title = "Subspace Frequency Analysis-Based Field Indices Extraction for Electricity Customer Classification", journal = j-TOIS, volume = "34", number = "2", pages = "12:1--12:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2858657", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In electricity customer classification, the most important task is to avoid the curse of dimensionality problem, as the consumption diagrams have a large number of dimensions. To avoid the curse of dimensionality problem, field indices (load shape factor) are often used instead of consumption diagrams. Field indices are directly extracted from consumption diagrams according to a predefined formula. Previous studies show that the most important thing for defining such a formula is to find meaningful time intervals from consumption diagrams. However, the inconvenient thing is that there are still a lack of details to explain how to define such time intervals. In our study, we propose a data mining--based method named SFATIE to support the extraction of field indices. The performance of the proposed method is evaluated by comparing it with other dimensionality reduction methods during the classification. For the classification, most often we have used classification methods like C5.0, SVM, Neural Net, Bayes Net, and Logistic. The experimental results show that our method is better or close to other dimensionality reduction methods. In addition, the experimental results show that our proposed method can produce the good quality of field indices and that these indices can improve the performance of electricity customer classification.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cheng:2016:ELA, author = "Zhiyong Cheng and Jialie Shen", title = "On Effective Location-Aware Music Recommendation", journal = j-TOIS, volume = "34", number = "2", pages = "13:1--13:??", month = apr, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2846092", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:33 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Rapid advances in mobile devices and cloud-based music service now allow consumers to enjoy music anytime and anywhere. Consequently, there has been an increasing demand in studying intelligent techniques to facilitate context-aware music recommendation. However, one important context that is generally overlooked is user's venue, which often includes surrounding atmosphere, correlates with activities, and greatly influences the user's music preferences. In this article, we present a novel venue-aware music recommender system called VenueMusic to effectively identify suitable songs for various types of popular venues in our daily lives. Toward this goal, a Location-aware Topic Model (LTM) is proposed to (i) mine the common features of songs that are suitable for a venue type in a latent semantic space and (ii) represent songs and venue types in the shared latent space, in which songs and venue types can be directly matched. It is worth mentioning that to discover meaningful latent topics with the LTM, a Music Concept Sequence Generation (MCSG) scheme is designed to extract effective semantic representations for songs. An extensive experimental study based on two large music test collections demonstrates the effectiveness of the proposed topic model and MCSG scheme. The comparisons with state-of-the-art music recommender systems demonstrate the superior performance of VenueMusic system on recommendation accuracy by associating venue and music contents using a latent semantic space. This work is a pioneering study on the development of a venue-aware music recommender system. The results show the importance of considering the influence of venue types in the development of context-aware music recommender systems.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Papadopoulos:2016:OSI, author = "Symeon Papadopoulos and Kalina Bontcheva and Eva Jaho and Mihai Lupu and Carlos Castillo", title = "Overview of the Special Issue on Trust and Veracity of Information in Social Media", journal = j-TOIS, volume = "34", number = "3", pages = "14:1--14:??", month = may, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2870630", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:34 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Webb:2016:DWP, author = "Helena Webb and Pete Burnap and Rob Procter and Omer Rana and Bernd Carsten Stahl and Matthew Williams and William Housley and Adam Edwards and Marina Jirotka", title = "Digital Wildfires: Propagation, Verification, Regulation, and Responsible Innovation", journal = j-TOIS, volume = "34", number = "3", pages = "15:1--15:??", month = may, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2893478", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:34 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Social media platforms provide an increasingly popular means for individuals to share content online. Whilst this produces undoubted societal benefits, the ability for content to be spontaneously posted and reposted creates an ideal environment for rumour and false/malicious information to spread rapidly. When this occurs it can cause significant harm and can be characterised as a ``digital wildfire.'' In this article, we demonstrate that the propagation and regulation of digital wildfires form important topics for research and conduct an overview of existing work in this area. We outline the relevance of a range of work from the computational and social sciences, including a series of insights into the propagation of rumour and false/malicious information. We argue that significant research gaps remain-for instance, there is an absence of systematic studies on the effects of digital wildfires and there is a need to combine empirical research with a consideration of how the responsible governance of social media can be determined. We propose an agenda for research that establishes a methodology to explore in full the propagation and regulation of unverified content on social media. This agenda promotes high-quality interdisciplinary research that will also inform policy debates.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Middleton:2016:GGS, author = "Stuart E. Middleton and Vadims Krivcovs", title = "Geoparsing and Geosemantics for Social Media: Spatiotemporal Grounding of Content Propagating Rumors to Support Trust and Veracity Analysis during Breaking News", journal = j-TOIS, volume = "34", number = "3", pages = "16:1--16:??", month = may, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2842604", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:34 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In recent years, there has been a growing trend to use publicly available social media sources within the field of journalism. Breaking news has tight reporting deadlines, measured in minutes not days, but content must still be checked and rumors verified. As such, journalists are looking at automated content analysis to prefilter large volumes of social media content prior to manual verification. This article describes a real-time social media analytics framework for journalists. We extend our previously published geoparsing approach to improve its scalability and efficiency. We develop and evaluate a novel approach to geosemantic feature extraction, classifying evidence in terms of situatedness, timeliness, confirmation, and validity. Our approach works for new unseen news topics. We report results from four experiments using five Twitter datasets crawled during different English-language news events. One of our datasets is the standard TREC 2012 microblog corpus. Our classification results are promising, with F1 scores varying by class from 0.64 to 0.92 for unseen event types. We lastly report results from two case studies during real-world news stories, showcasing different ways our system can assist journalists filter and cross-check content as they examine the trust and veracity of content and sources.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hamdi:2016:TTI, author = "Sana Hamdi and Alda Lopes Gancarski and Amel Bouzeghoub and Sadok Ben Yahia", title = "{TISoN}: Trust Inference in Trust-Oriented Social Networks", journal = j-TOIS, volume = "34", number = "3", pages = "17:1--17:??", month = may, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2858791", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:34 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Trust systems represent a significant trend in decision support for social networks' service provision. The basic idea is to allow users to rate each other even without being direct neighbours. In this case, the purpose is to derive a trust score for a given user, which could be of help to decide whether to trust other users or not. In this article, we investigate the properties of trust propagation within social networks, based on the notion of transitivity, and we introduce the TISoN model to generate and evaluate Trust Inference within online Social Networks. To do so, ( i ) we develop a novel TPS algorithm for Trust Path Searching where we define neighbours' priority based on their direct trust degrees, and then select trusted paths while controlling the path length; and, ( ii ) we develop different TIM algorithms for Trust Inference Measuring and build a trust network. In addition, we analyse existing algorithms and we demonstrate that our proposed model better computes transitive trust values than do the existing models. We conduct extensive experiments on a real online social network dataset, Advogato. Experimental results show that our work is scalable and generates better results than do the pioneering approaches of the literature.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2016:MOS, author = "Huiling Zhang and Md Abdul Alim and Xiang Li and My T. Thai and Hien T. Nguyen", title = "Misinformation in Online Social Networks: Detect Them All with a Limited Budget", journal = j-TOIS, volume = "34", number = "3", pages = "18:1--18:??", month = may, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2885494", ISSN = "1046-8188", bibdate = "Mon Jun 20 18:55:34 MDT 2016", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Online social networks have become an effective and important social platform for communication, opinions exchange, and information sharing. However, they also make it possible for rapid and wide misinformation diffusion, which may lead to pernicious influences on individuals or society. Hence, it is extremely important and necessary to detect the misinformation propagation by placing monitors. In this article, we first define a general misinformation-detection problem for the case where the knowledge about misinformation sources is lacking, and show its equivalence to the influence-maximization problem in the reverse graph. Furthermore, considering node vulnerability, we aim to detect the misinformation reaching to a specific user. Therefore, we study a $\tau$-Monitor Placement problem for cases where partial knowledge of misinformation sources is available and prove its \#P complexity. We formulate a corresponding integer program, tackle exponential constraints, and propose a Minimum Monitor Set Construction (MMSC) algorithm, in which the cut-set$^2$ has been exploited in the estimation of reachability of node pairs. Moreover, we generalize the problem from a single target to multiple central nodes and propose another algorithm based on a Monte Carlo sampling technique. Extensive experiments on real-world networks show the effectiveness of proposed algorithms with respect to minimizing the number of monitors.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Shtok:2016:QPP, author = "Anna Shtok and Oren Kurland and David Carmel", title = "Query Performance Prediction Using Reference Lists", journal = j-TOIS, volume = "34", number = "4", pages = "19:1--19:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2926790", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The task of query performance prediction is to estimate the effectiveness of search performed in response to a query when no relevance judgments are available. We present a novel probabilistic analysis of the performance prediction task. The analysis gives rise to a general prediction framework that uses pseudo-effective or ineffective document lists that are retrieved in response to the query. These lists serve as reference to the result list at hand, the effectiveness of which we want to predict. We show that many previously proposed prediction methods can be explained using our framework. More generally, we shed new light on existing prediction methods and establish formal common grounds to seemingly different prediction approaches. In addition, we formally demonstrate the connection between prediction using reference lists and fusion of retrieved lists, and provide empirical support to this connection. Through an extensive empirical exploration, we study various factors that affect the quality of prediction using reference lists.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ibrahim:2016:CPL, author = "Muhammad Ibrahim and Mark Carman", title = "Comparing Pointwise and Listwise Objective Functions for Random-Forest-Based Learning-to-Rank", journal = j-TOIS, volume = "34", number = "4", pages = "20:1--20:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2866571", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Current random-forest (RF)-based learning-to-rank (LtR) algorithms use a classification or regression framework to solve the ranking problem in a pointwise manner. The success of this simple yet effective approach coupled with the inherent parallelizability of the learning algorithm makes it a strong candidate for widespread adoption. In this article, we aim to better understand the effectiveness of RF-based rank-learning algorithms with a focus on the comparison between pointwise and listwise approaches. We introduce what we believe to be the first listwise version of an RF-based LtR algorithm. The algorithm directly optimizes an information retrieval metric of choice (in our case, NDCG) in a greedy manner. Direct optimization of the listwise objective functions is computationally prohibitive for most learning algorithms, but possible in RF since each tree maximizes the objective in a coordinate-wise fashion. Computational complexity of the listwise approach is higher than the pointwise counterpart; hence for larger datasets, we design a hybrid algorithm that combines a listwise objective in the early stages of tree construction and a pointwise objective in the latter stages. We also study the effect of the discount function of NDCG on the listwise algorithm. Experimental results on several publicly available LtR datasets reveal that the listwise/hybrid algorithm outperforms the pointwise approach on the majority (but not all) of the datasets. We then investigate several aspects of the two algorithms to better understand the inevitable performance tradeoffs. The aspects include examining an RF-based unsupervised LtR algorithm and comparing individual tree strength. Finally, we compare the the investigated RF-based algorithms with several other LtR algorithms.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Do:2016:PMC, author = "Loc Do and Hady W. Lauw", title = "Probabilistic Models for Contextual Agreement in Preferences", journal = j-TOIS, volume = "34", number = "4", pages = "21:1--21:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2854147", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The long-tail theory for consumer demand implies the need for more accurate personalization technologies to target items to the users who most desire them. A key tenet of personalization is the capacity to model user preferences. Most of the previous work on recommendation and personalization has focused primarily on individual preferences. While some focus on shared preferences between pairs of users, they assume that the same similarity value applies to all items. Here we investigate the notion of ``context,'' hypothesizing that while two users may agree on their preferences on some items, they may also disagree on other items. To model this, we design probabilistic models for the generation of rating differences between pairs of users across different items. Since this model also involves the estimation of rating differences on unseen items for the purpose of prediction, we further conduct a systematic analysis of matrix factorization and tensor factorization methods in this estimation, and propose a factorization model with a novel objective function of minimizing error in rating differences. Experiments on several real-life rating datasets show that our proposed model consistently yields context-specific similarity values that perform better on a prediction task than models relying on shared preferences.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Miao:2016:TPF, author = "Jun Miao and Jimmy Xiangji Huang and Jiashu Zhao", title = "{TopPRF}: a Probabilistic Framework for Integrating Topic Space into Pseudo Relevance Feedback", journal = j-TOIS, volume = "34", number = "4", pages = "22:1--22:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2956234", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Traditional pseudo relevance feedback (PRF) models choose top k feedback documents for query expansion and treat those documents equally. When k is determined, feedback terms are selected without considering the reliability of these documents for relevance. Because the performance of PRF is sensitive to the selection of feedback terms, noisy terms imported from these irrelevant documents or partially relevant documents will harm the final results extensively. Intuitively, terms in these documents should be considered less important for feedback term selection. Nonetheless, how to measure the reliability of feedback documents is a difficult problem. Recently, topic modeling has become more and more popular in the information retrieval (IR) area. In order to identify how reliable a feedback document is to be relevant, we attempt to adapt the topical information into PRF. However, topics are hard to be quantified and therefore the identification of topic is usually fuzzy. It is very challenging for integrating the obtained topical information effectively into IR and other text-processing-related areas. Current research work mainly focuses on mining relevant information from particular topics. This is extremely difficult when the boundaries of different topics are hard to define. In this article, we investigate a key factor of this problem, the topic number for topic modeling and how it makes topics ``fuzzy.'' To effectively and efficiently apply topical information, we propose a new probabilistic framework, ``TopPRF,'' and three models, TS-COS, TS-EU, and TS-Entropy, via integrating ``Topic Space'' (TS) information into pseudo relevance feedback. These methods discover how reliable a document is to be relevant through both term and topical information. When selecting feedback terms, candidate terms in more reliable feedback documents should obtain extra weights. Experimental results on various public collections justify that our proposed methods can significantly reduce the influence of ``fuzzy topics'' and obtain stable, good results over the strong baseline models. Our proposed probabilistic framework, TopPRF, and three topic-space-based models are capable of searching documents beyond traditional term matching only and provide a promising avenue for constructing better topic-space-based IR systems. Moreover, in-depth discussions and conclusions are made to help other researchers apply topical information effectively.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Kharazmi:2016:EAW, author = "Sadegh Kharazmi and Falk Scholer and David Vallet and Mark Sanderson", title = "Examining Additivity and Weak Baselines", journal = j-TOIS, volume = "34", number = "4", pages = "23:1--23:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2882782", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present a study of which baseline to use when testing a new retrieval technique. In contrast to past work, we show that measuring a statistically significant improvement over a weak baseline is not a good predictor of whether a similar improvement will be measured on a strong baseline. Sometimes strong baselines are made worse when a new technique is applied. We investigate whether conducting comparisons against a range of weaker baselines can increase confidence that an observed effect will also show improvements on a stronger baseline. Our results indicate that this is not the case --- at best, testing against a range of baselines means that an experimenter can be more confident that the new technique is unlikely to significantly harm a strong baseline. Examining recent past work, we present evidence that the information retrieval (IR) community continues to test against weak baselines. This is unfortunate as, in light of our experiments, we conclude that the only way to be confident that a new technique is a contribution is to compare it against nothing less than the state of the art.", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Luo:2016:MSU, author = "Xiangfeng Luo and Junyu Xuan and Jie Lu and Guangquan Zhang", title = "Measuring the Semantic Uncertainty of News Events for Evolution Potential Estimation", journal = j-TOIS, volume = "34", number = "4", pages = "24:1--24:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2903719", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The evolution potential estimation of news events can support the decision making of both corporations and governments. For example, a corporation could manage its public relations crisis in a timely manner if a negative news event about this corporation is known with large evolution potential in advance. However, existing state-of-the-art methods are mainly based on time series historical data, which are not suitable for the news events with limited historical data and bursty properties. In this article, we propose a purely content-based method to estimate the evolution potential of the news events. The proposed method considers a news event at a given time point as a system composed of different keywords, and the uncertainty of this system is defined and measured as the Semantic Uncertainty of this news event. At the same time, an uncertainty space is constructed with two extreme states: the most uncertain state and the most certain state. We believe that the Semantic Uncertainty has correlation with the content evolution of the news events, so it can be used to estimate the evolution potential of the news events. In order to verify the proposed method, we present detailed experimental setups and results measuring the correlation of the Semantic Uncertainty with the Content Change of news events using collected news events data. The results show that the correlation does exist and is stronger than the correlation of value from the time-series-based method with the Content Change. Therefore, we can use the Semantic Uncertainty to estimate the evolution potential of news events.", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cai:2016:DQA, author = "Fei Cai and Ridho Reinanda and Maarten {De Rijke}", title = "Diversifying Query Auto-Completion", journal = j-TOIS, volume = "34", number = "4", pages = "25:1--25:??", month = sep, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2910579", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:18 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Query auto-completion assists web search users in formulating queries with a few keystrokes, helping them to avoid spelling mistakes and to produce clear query expressions, and so on. Previous work on query auto-completion mainly centers around returning a list of completions to users, aiming to push queries that are most likely intended by the user to the top positions but ignoring the redundancy among the query candidates in the list. Thus, semantically related queries matching the input prefix are often returned together. This may push valuable suggestions out of the list, given that only a limited number of candidates can be shown to the user, which may result in a less than optimal search experience. In this article, we consider the task of diversifying query auto-completion, which aims to return the correct query completions early in a ranked list of candidate completions and at the same time reduce the redundancy among query auto-completion candidates. We develop a greedy query selection approach that predicts query completions based on the current search popularity of candidate completions and on the aspects of previous queries in the same search session. The popularity of completion candidates at query time can be directly aggregated from query logs. However, query aspects are implicitly expressed by previous clicked documents in the search context. To determine the query aspect, we categorize clicked documents of a query using a hierarchy based on the open directory project. Bayesian probabilistic matrix factorization is applied to derive the distribution of queries over all aspects. We quantify the improvement of our greedy query selection model against a state-of-the-art baseline using two large-scale, real-world query logs and show that it beats the baseline in terms of well-known metrics used in query auto-completion and diversification. In addition, we conduct a side-by-side experiment to verify the effectiveness of our proposal.", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Morsy:2016:ALC, author = "Sara Morsy and George Karypis", title = "Accounting for Language Changes Over Time in Document Similarity Search", journal = j-TOIS, volume = "35", number = "1", pages = "1:1--1:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2934671", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Given a query document, ranking the documents in a collection based on how similar they are to the query is an essential task with extensive applications. For collections that contain documents whose creation dates span several decades, this task is further complicated by the fact that the language changes over time. For example, many terms add or lose one or more senses to meet people's evolving needs. To address this problem, we present methods that take advantage of two types of information to account for the language change. The first is the citation network that often exists within the collection, which can be used to link related documents with significantly different creation dates (and hence different language use). The second is the changes in the usage frequency of terms that occur over time, which can indicate changes in their senses and uses. These methods utilize the preceding information while estimating the representation of both documents and terms within the context of nonprobabilistic static and dynamic topic models. Our experiments on two real-world datasets that span more than 40 years show that our proposed methods improve the retrieval performance of existing models and that these improvements are statistically significant.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Arguello:2016:EAS, author = "Jaime Arguello and Rob Capra", title = "The Effects of Aggregated Search Coherence on Search Behavior", journal = j-TOIS, volume = "35", number = "1", pages = "2:1--2:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2935747", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Aggregated search is the task of combining results from multiple independent search systems in a single Search Engine Results Page (SERP). Aggregated search coherence refers to the extent to which different sources on the SERP focus on similar senses of an ambiguous or underspecified query. In previous studies, we found that the query senses in a set of vertical results can influence user engagement with the web results (the so-called ``spillover'' effect). In this work, we investigate five research questions (RQ1--RQ5) that extend our prior work. First, we investigate the extent to which results from different sources focus on different senses of an ambiguous query (RQ1). Second, we investigate how the vertical-to-web spillover effect varies across different verticals (RQ2). Then, we examine whether the level of spillover depends on the vertical position (RQ3) and on whether the vertical results are displayed with a border and different-colored background to distinguish them from the web results (RQ4). Finally, we propose a new method for displaying results from a particular vertical that are more consistent with the query senses in the web results (RQ5). We evaluate this new method based on how it influences users to make more correct decisions with respect to the web results-to engage with the web results when at least one of them is relevant and to avoid engaging with the web results otherwise. Our results show the following trends. In terms of RQ1, our analysis suggests that the top results from the web search engine are more diversified than the top results from our four different verticals considered (images, news, shopping, and video). In terms of RQ2, we found a stronger spillover effect for the images vertical than the news, shopping, and video verticals. In terms of RQ3, we found a stronger level of spillover when the vertical was positioned at the top of the SERP versus to the right side of the web results. In terms of RQ4, we found an interesting additive effect between the vertical's position and displaying the vertical results enclosed in a border and with a different-colored background-the image vertical had no spillover when presented to the right side of the web results and with a border and background. Finally, in terms of RQ5, we found that our proposed vertical results selection approach can influence users to make more correct predictions about their level of engagement with the web results.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2016:CRD, author = "Yating Zhang and Adam Jatowt and Katsumi Tanaka", title = "Causal Relationship Detection in Archival Collections of Product Reviews for Understanding Technology Evolution", journal = j-TOIS, volume = "35", number = "1", pages = "3:1--3:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2937752", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Technology progress is one of the key reasons behind today's rapid changes in lifestyles. Knowing how products and objects evolve can not only help with understanding the evolutionary patterns in our society but can also provide clues on effective product design and can offer support for predicting the future. We propose a general framework for analyzing technology's impact on our lives through detecting cause--effect relationships, where causes represent changes in technology while effects are changes in social life, such as new activities or new ways of using products. We address the challenge of viewing technology evolution through the ``social impact lens'' by mining causal relationships from the long-term collections of product reviews. In particular, we first propose dividing vocabulary into two groups: terms describing product features (called physical terms ) and terms representing product usage (called conceptual terms ). We then search for two kinds of changes related to the appearance of terms: frequency-based and context-based changes. The former indicate periods when a word was significantly more frequently used, whereas the latter indicate periods of high change in the word's context. Based on the detected changes, we then search for causal term pairs such that the change in the physical term triggers the change in the conceptual term. We next extend our approach to finding causal relationships between word groups such as a group of words representing the same technology and causing a given conceptual change or group of words representing two different technologies that simultaneously ``co-cause'' a conceptual change. We conduct experiments on different product types using the Amazon Product Review Dataset, which spans 1995 to 2013, and we demonstrate that our approaches outperform state-of-the-art baselines.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Molino:2016:SQA, author = "Piero Molino and Luca Maria Aiello and Pasquale Lops", title = "Social Question Answering: Textual, User, and Network Features for Best Answer Prediction", journal = j-TOIS, volume = "35", number = "1", pages = "4:1--4:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2948063", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Community question answering (CQA) sites use a collaborative paradigm to satisfy complex information needs. Although the task of matching questions to their best answers has been tackled for more than a decade, the social question-answering practice is a complex process. The factors influencing the accuracy of question-answer matching are many and hard to disentangle. We approach the task from an application-oriented perspective, probing the space of several dimensions relevant to this problem: features, algorithms, and topics. We gather under a learning to rank framework the most extensive feature set used in literature to date, including 225 features from five different families. We test the power of such features in predicting the best answer to a question on the largest dataset from Yahoo Answers used for this task so far (40M answers) and provide a faceted analysis of the results along different topical areas and question types. We propose a novel family of distributional semantics measures that most of the time can seamlessly replace widely used linguistic similarity features, being more than one order of magnitude faster to compute and providing greater predictive power. The best feature set reaches an improvement between 11\% and 26\% in P@1 compared to recent well-established state-of-the-art methods.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2016:TRM, author = "Chenyi Zhang and Hongwei Liang and Ke Wang", title = "Trip Recommendation Meets Real-World Constraints: {POI} Availability, Diversity, and Traveling Time Uncertainty", journal = j-TOIS, volume = "35", number = "1", pages = "5:1--5:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2948065", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "As location-based social network (LBSN) services become increasingly popular, trip recommendation that recommends a sequence of points of interest (POIs) to visit for a user emerges as one of many important applications of LBSNs. Personalized trip recommendation tailors to users' specific tastes by learning from past check-in behaviors of users and their peers. Finding the optimal trip that maximizes user's experiences for a given time budget constraint is an NP-hard problem and previous solutions do not consider three practical and important constraints. One constraint is POI availability, where a POI may be only available during a certain time window. Another constraint is uncertain traveling time, where the traveling time between two POIs is uncertain. In addition, the diversity of the POIs included in the trip plays an important role in user's final adoptions. This work presents efficient solutions to personalized trip recommendation by incorporating these constraints and leveraging them to prune the search space. We evaluated the efficiency and effectiveness of our solutions on real-life LBSN datasets.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Azmi:2016:AAW, author = "Aqil M. Azmi and Nouf A. Alshenaifi", title = "Answering {Arabic} Why-Questions: Baseline vs. {RST}-Based Approach", journal = j-TOIS, volume = "35", number = "1", pages = "6:1--6:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2950049", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A Question Answering (QA) system is concerned with building a system that automatically answer questions posed by humans in a natural language. Compared to other languages, little effort was directed towards QA systems for Arabic. Due to the difficulty of handling why -questions, most Arabic QA systems tend to ignore it. In this article, we specifically address the why -question for Arabic using two different approaches and compare their performance and the quality of their answer. The first is the baseline approach, a generic method that is used to answer all types of questions, including factoid; and for the second approach, we use Rhetorical Structure Theory (RST). We evaluate both schemes using a corpus of 700 textual documents in different genres collected from Open Source Arabic Corpora (OSAC), and a set of 100 question-answer pairs. Overall, the performance measures of recall, precision, and c@1 was 68\% (all three measures) for the baseline approach, and 71\%, 78\%, and 77.4\%, respectively, for the RST-based approach. The recently introduced extension of the accuracy, the c@1 measure, rewards unanswered questions over those wrongly answered.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Baly:2016:MFM, author = "Ramy Baly and Roula Hobeica and Hazem Hajj and Wassim El-Hajj and Khaled Bashir Shaban and Ahmad Al-Sallab", title = "A Meta-Framework for Modeling the Human Reading Process in Sentiment Analysis", journal = j-TOIS, volume = "35", number = "1", pages = "7:1--7:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2950050", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article introduces a sentiment analysis approach that adopts the way humans read, interpret, and extract sentiment from text. Our motivation builds on the assumption that human interpretation should lead to the most accurate assessment of sentiment in text. We call this automated process Human Reading for Sentiment (HRS). Previous research in sentiment analysis has produced many frameworks that can fit one or more of the HRS aspects; however, none of these methods has addressed them all in one approach. HRS provides a meta-framework for developing new sentiment analysis methods or improving existing ones. The proposed framework provides a theoretical lens for zooming in and evaluating aspects of any sentiment analysis method to identify gaps for improvements towards matching the human reading process. Key steps in HRS include the automation of humans low-level and high-level cognitive text processing. This methodology paves the way towards the integration of psychology with computational linguistics and machine learning to employ models of pragmatics and discourse analysis for sentiment analysis. HRS is tested with two state-of-the-art methods; one is based on feature engineering, and the other is based on deep learning. HRS highlighted the gaps in both methods and showed improvements for both.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhao:2016:PLB, author = "Wayne Xin Zhao and Ningnan Zhou and Wenhui Zhang and Ji-Rong Wen and Shan Wang and Edward Y. Chang", title = "A Probabilistic Lifestyle-Based Trajectory Model for Social Strength Inference from Human Trajectory Data", journal = j-TOIS, volume = "35", number = "1", pages = "8:1--8:??", month = oct, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2948064", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the pervasiveness of location-based social networks, it becomes increasingly important to consider the social characteristics of locations shared among persons. Several studies have been proposed to infer social strength by using trajectory similarity. However, these studies have two major shortcomings. First, they rely on the explicit co-occurrence of check-in locations. In this situation, a user pair of two friends who seldom share common locations or a user pair of two strangers who heavily share common visited locations will receive an unreliable estimation of the real social strength between them. Second, these studies do not consider how the overall trajectory patterns of users change with the varying of living styles. In this article, we propose a probabilistic generative model to mine latent lifestyle-related patterns from human trajectory data for inferring social strength. It can automatically learn functionality topics consisting of locations with similar service functions and transition probabilities over the set of functionality topics. Furthermore, a lifestyle is modeled as a unique transition probability matrix over the set of functionality topics. A user has a preference distribution over the set of lifestyles, and he or she is able to select over multiple lifestyles to adapt to different living contexts. The learned lifestyle-related patterns are subsequently used as features in a supervised learner for both strength estimation and link prediction. We conduct extensive experiments to evaluate the performance of the proposed method on two real-world datasets. The experimental results demonstrate the effectiveness of our proposed method.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Jiang:2016:CLT, author = "Di Jiang and Yongxin Tong and Yuanfeng Song", title = "Cross-Lingual Topic Discovery From Multilingual Search Engine Query Log", journal = j-TOIS, volume = "35", number = "2", pages = "9:1--9:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2956235", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Today, major commercial search engines are operating in a multinational fashion to provide web search services for millions of users who compose search queries by different languages. Hence, the search engine query log, which serves as the backbone of many search engine applications, records millions of users' search history in a wide spectrum of human languages and demonstrates a strong multilingual phenomenon. However, with its salience, the multilingual nature of a search engine query log is usually ignored by existing works, which usually consider query log entries of different languages as being orthogonal and independent. This kind of oversimplified assumption heavily distorts the underlying structure of web search data. In this article, we pioneer in recognition of the multilingual nature of a query log and make the first attempt to cross the language barrier in query logs. We propose a novel model named Cross-Lingual Query Log Topic Model (CL-QLTM) to analyze query logs from a cross-lingual perspective and derive the latent topics of web search data. The CL-QLTM comprehensively integrates web search data in different languages by collectively utilizing cross-lingual dictionaries, as well as the co-occurrence relations in the query log. In order to relieve the efficiency bottleneck of applying the CL-QLTM on voluminous query logs, we propose an efficient parameter inference algorithm based on the MapReduce computing paradigm. Both qualitative and quantitative experimental results show that the CL-QLTM is able to effectively derive cross-lingual topics from multilingual query logs and spawn a wide spectrum of new search engine applications.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2016:ROC, author = "Shuaiqiang Wang and Shanshan Huang and Tie-Yan Liu and Jun Ma and Zhumin Chen and Jari Veijalainen", title = "Ranking-Oriented Collaborative Filtering: a Listwise Approach", journal = j-TOIS, volume = "35", number = "2", pages = "10:1--10:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2960408", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Collaborative filtering (CF) is one of the most effective techniques in recommender systems, which can be either rating oriented or ranking oriented. Ranking-oriented CF algorithms demonstrated significant performance gains in terms of ranking accuracy, being able to estimate a precise preference ranking of items for each user rather than the absolute ratings (as rating-oriented CF algorithms do). Conventional memory-based ranking-oriented CF can be referred to as pairwise algorithms. They represent each user as a set of preferences on each pair of items for similarity calculations and predictions. In this study, we propose ListCF, a novel listwise CF paradigm that seeks improvement in both accuracy and efficiency in comparison with pairwise CF. In ListCF, each user is represented as a probability distribution of the permutations over rated items based on the Plackett-Luce model, and the similarity between users is measured based on the Kullback--Leibler divergence between their probability distributions over the set of commonly rated items. Given a target user and the most similar users, ListCF directly predicts a total order of items for each user based on similar users' probability distributions over permutations of the items. Besides, we also reveal insightful connections among pointwise, pairwise, and listwise CF algorithms from the perspective of the matrix representations. In addition, to make our algorithm more scalable and adaptive, we present an incremental algorithm for ListCF, which allows incrementally updating the similarities between users when certain user submits a new rating or updates an existing rating. Extensive experiments on benchmark datasets in comparison with the state-of-the-art approaches demonstrate the promise of our approach.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yin:2016:JMU, author = "Hongzhi Yin and Bin Cui and Xiaofang Zhou and Weiqing Wang and Zi Huang and Shazia Sadiq", title = "Joint Modeling of User Check-in Behaviors for Real-time Point-of-Interest Recommendation", journal = j-TOIS, volume = "35", number = "2", pages = "11:1--11:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2873055", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Point-of-Interest (POI) recommendation has become an important means to help people discover attractive and interesting places, especially when users travel out of town. However, the extreme sparsity of a user-POI matrix creates a severe challenge. To cope with this challenge, we propose a unified probabilistic generative model, the Topic-Region Model (TRM), to simultaneously discover the semantic, temporal, and spatial patterns of users' check-in activities, and to model their joint effect on users' decision making for selection of POIs to visit. To demonstrate the applicability and flexibility of TRM, we investigate how it supports two recommendation scenarios in a unified way, that is, hometown recommendation and out-of-town recommendation. TRM effectively overcomes data sparsity by the complementarity and mutual enhancement of the diverse information associated with users' check-in activities (e.g., check-in content, time, and location) in the processes of discovering heterogeneous patterns and producing recommendations. To support real-time POI recommendations, we further extend the TRM model to an online learning model, TRM-Online, to track changing user interests and speed up the model training. In addition, based on the learned model, we propose a clustering-based branch and bound algorithm (CBB) to prune the POI search space and facilitate fast retrieval of the top- k recommendations. We conduct extensive experiments to evaluate the performance of our proposals on two real-world datasets, including recommendation effectiveness, overcoming the cold-start problem, recommendation efficiency, and model-training efficiency. The experimental results demonstrate the superiority of our TRM models, especially TRM-Online, compared with state-of-the-art competitive methods, by making more effective and efficient mobile recommendations. In addition, we study the importance of each type of pattern in the two recommendation scenarios, respectively, and find that exploiting temporal patterns is most important for the hometown recommendation scenario, while the semantic patterns play a dominant role in improving the recommendation effectiveness for out-of-town users.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chen:2016:BRU, author = "Jia Chen and Qin Jin and Shiwan Zhao and Shenghua Bao and Li Zhang and Zhong Su and Yong Yu", title = "Boosting Recommendation in Unexplored Categories by User Price Preference", journal = j-TOIS, volume = "35", number = "2", pages = "12:1--12:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2978579", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "State-of-the-art methods for product recommendation encounter a significant performance drop in categories where a user has no purchase history. This problem needs to be addressed since current online retailers are moving beyond single category and attempting to be diversified. In this article, we investigate the challenging problem of product recommendation in unexplored categories and discover that the price, a factor comparable across categories, can improve the recommendation performance significantly. We introduce the price utility concept to characterize users' sense of price and propose three different utility functions. We show that user price preference in a category is a distribution and we mine typical user price preference patterns based on three different types of distance between distributions. We fuse user price preference through regularization and joint factorization to boost recommendation performance in both browsing and buying shopping orientations. Experimental results show that fusing user price preference improves performance in a series of recommendation tasks: unexplored category recommendation, product recommendation under a given unexplored category, and product recommendation under generic unexplored categories.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hu:2016:LIP, author = "Liang Hu and Longbing Cao and Jian Cao and Zhiping Gu and Guandong Xu and Dingyu Yang", title = "Learning Informative Priors from Heterogeneous Domains to Improve Recommendation in Cold-Start User Domains", journal = j-TOIS, volume = "35", number = "2", pages = "13:1--13:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2976737", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In the real-world environment, users have sufficient experience in their focused domains but lack experience in other domains. Recommender systems are very helpful for recommending potentially desirable items to users in unfamiliar domains, and cross-domain collaborative filtering is therefore an important emerging research topic. However, it is inevitable that the cold-start issue will be encountered in unfamiliar domains due to the lack of feedback data. The Bayesian approach shows that priors play an important role when there are insufficient data, which implies that recommendation performance can be significantly improved in cold-start domains if informative priors can be provided. Based on this idea, we propose a Weighted Irregular Tensor Factorization (WITF) model to leverage multi-domain feedback data across all users to learn the cross-domain priors w.r.t. both users and items. The features learned from WITF serve as the informative priors on the latent factors of users and items in terms of weighted matrix factorization models. Moreover, WITF is a unified framework for dealing with both explicit feedback and implicit feedback. To prove the effectiveness of our approach, we studied three typical real-world cases in which a collection of empirical evaluations were conducted on real-world datasets to compare the performance of our model and other state-of-the-art approaches. The results show the superiority of our model over comparison models.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Thomason:2016:CTA, author = "Alasdair Thomason and Nathan Griffiths and Victor Sanchez", title = "Context Trees: Augmenting Geospatial Trajectories with Context", journal = j-TOIS, volume = "35", number = "2", pages = "14:1--14:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2978578", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Exposing latent knowledge in geospatial trajectories has the potential to provide a better understanding of the movements of individuals and groups. Motivated by such a desire, this work presents the context tree, a new hierarchical data structure that summarises the context behind user actions in a single model. We propose a method for context tree construction that augments geospatial trajectories with land usage data to identify such contexts. Through evaluation of the construction method and analysis of the properties of generated context trees, we demonstrate the foundation for understanding and modelling behaviour afforded. Summarising user contexts into a single data structure gives easy access to information that would otherwise remain latent, providing the basis for better understanding and predicting the actions and behaviours of individuals and groups. Finally, we also present a method for pruning context trees for use in applications where it is desirable to reduce the size of the tree while retaining useful information.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Dato:2016:FRA, author = "Domenico Dato and Claudio Lucchese and Franco Maria Nardini and Salvatore Orlando and Raffaele Perego and Nicola Tonellotto and Rossano Venturini", title = "Fast Ranking with Additive Ensembles of Oblivious and Non-Oblivious Regression Trees", journal = j-TOIS, volume = "35", number = "2", pages = "15:1--15:??", month = dec, year = "2016", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2987380", ISSN = "1046-8188", bibdate = "Mon Apr 3 11:29:19 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Learning-to-Rank models based on additive ensembles of regression trees have been proven to be very effective for scoring query results returned by large-scale Web search engines. Unfortunately, the computational cost of scoring thousands of candidate documents by traversing large ensembles of trees is high. Thus, several works have investigated solutions aimed at improving the efficiency of document scoring by exploiting advanced features of modern CPUs and memory hierarchies. In this article, we present QuickScorer, a new algorithm that adopts a novel cache-efficient representation of a given tree ensemble, performs an interleaved traversal by means of fast bitwise operations, and supports ensembles of oblivious trees. An extensive and detailed test assessment is conducted on two standard Learning-to-Rank datasets and on a novel very large dataset we made publicly available for conducting significant efficiency tests. The experiments show unprecedented speedups over the best state-of-the-art baselines ranging from $ 1.9 \times $ to $ 6.6 \times $. The analysis of low-level profiling traces shows that QuickScorer efficiency is due to its cache-aware approach in terms of both data layout and access patterns and to a control flow that entails very low branch mis-prediction rates.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2017:TAC, author = "Yiqun Liu and Xiaohui Xie and Chao Wang and Jian-Yun Nie and Min Zhang and Shaoping Ma", title = "Time-Aware Click Model", journal = j-TOIS, volume = "35", number = "3", pages = "16:1--16:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2988230", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Click-through information is considered as a valuable source of users' implicit relevance feedback for commercial search engines. As existing studies have shown that the search result position in a search engine result page (SERP) has a very strong influence on users' examination behavior, most existing click models are position based, assuming that users examine results from top to bottom in a linear fashion. Although these click models have been successful, most do not take temporal information into account. As many existing studies have shown, click dwell time and click sequence information are strongly correlated with users' perceived relevance and search satisfaction. Incorporating temporal information may be important to improve performance of user click models for Web searches. In this article, we investigate the problem of properly incorporating temporal information into click models. We first carry out a laboratory eye-tracking study to analyze users' examination behavior in different click sequences and find that the user common examination path among adjacent clicks is linear. Next, we analyze the user dwell time distribution in different search logs and find that we cannot simply use a click dwell time threshold (e.g., 30 seconds) to distinguish relevant/irrelevant results. Finally, we propose a novel time-aware click model (TACM), which captures the temporal information of user behavior. We compare the TACM to several existing click models using two real-world search engine logs. Experimental results show that the TACM outperforms other click models in terms of both predicting click behavior (perplexity) and estimating result relevance (NDCG).", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Connor:2017:HEI, author = "Richard Connor and Franco Alberto Cardillo and Lucia Vadicamo and Fausto Rabitti", title = "{Hilbert} Exclusion: Improved Metric Search through Finite Isometric Embeddings", journal = j-TOIS, volume = "35", number = "3", pages = "17:1--17:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3001583", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Most research into similarity search in metric spaces relies on the triangle inequality property. This property allows the space to be arranged according to relative distances to avoid searching some subspaces. We show that many common metric spaces, notably including those using Euclidean and Jensen-Shannon distances, also have a stronger property, sometimes called the four-point property: In essence, these spaces allow an isometric embedding of any four points in three-dimensional Euclidean space, as well as any three points in two-dimensional Euclidean space. In fact, we show that any space that is isometrically embeddable in Hilbert space has the stronger property. This property gives stronger geometric guarantees, and one in particular, which we name the Hilbert Exclusion property, allows any indexing mechanism which uses hyperplane partitioning to perform better. One outcome of this observation is that a number of state-of-the-art indexing mechanisms over high-dimensional spaces can be easily refined to give a significant increase in performance; furthermore, the improvement given is greater in higher dimensions. This therefore leads to a significant improvement in the cost of metric search in these spaces.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Miao:2017:CEO, author = "Zhongchen Miao and Kai Chen and Yi Fang and Jianhua He and Yi Zhou and Wenjun Zhang and Hongyuan Zha", title = "Cost-Effective Online Trending Topic Detection and Popularity Prediction in Microblogging", journal = j-TOIS, volume = "35", number = "3", pages = "18:1--18:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3001833", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Identifying topic trends on microblogging services such as Twitter and estimating those topics' future popularity have great academic and business value, especially when the operations can be done in real time. For any third party, however, capturing and processing such huge volumes of real-time data in microblogs are almost infeasible tasks, as there always exist API (Application Program Interface) request limits, monitoring and computing budgets, as well as timeliness requirements. To deal with these challenges, we propose a cost-effective system framework with algorithms that can automatically select a subset of representative users in microblogging networks in offline, under given cost constraints. Then the proposed system can online monitor and utilize only these selected users' real-time microposts to detect the overall trending topics and predict their future popularity among the whole microblogging network. Therefore, our proposed system framework is practical for real-time usage as it avoids the high cost in capturing and processing full real-time data, while not compromising detection and prediction performance under given cost constraints. Experiments with real microblogs dataset show that by tracking only 500 users out of 0.6 million users and processing no more than 30,000 microposts daily, about 92\% trending topics could be detected and predicted by the proposed system and, on average, more than 10 hours earlier than they appear in official trends lists.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Maddalena:2017:CRM, author = "Eddy Maddalena and Stefano Mizzaro and Falk Scholer and Andrew Turpin", title = "On Crowdsourcing Relevance Magnitudes for Information Retrieval Evaluation", journal = j-TOIS, volume = "35", number = "3", pages = "19:1--19:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3002172", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Magnitude estimation is a psychophysical scaling technique for the measurement of sensation, where observers assign numbers to stimuli in response to their perceived intensity. We investigate the use of magnitude estimation for judging the relevance of documents for information retrieval evaluation, carrying out a large-scale user study across 18 TREC topics and collecting over 50,000 magnitude estimation judgments using crowdsourcing. Our analysis shows that magnitude estimation judgments can be reliably collected using crowdsourcing, are competitive in terms of assessor cost, and are, on average, rank-aligned with ordinal judgments made by expert relevance assessors. We explore the application of magnitude estimation for IR evaluation, calibrating two gain-based effectiveness metrics, nDCG and ERR, directly from user-reported perceptions of relevance. A comparison of TREC system effectiveness rankings based on binary, ordinal, and magnitude estimation relevance shows substantial variation; in particular, the top systems ranked using magnitude estimation and ordinal judgments differ substantially. Analysis of the magnitude estimation scores shows that this effect is due in part to varying perceptions of relevance: different users have different perceptions of the impact of relative differences in document relevance. These results have direct implications for IR evaluation, suggesting that current assumptions about a single view of relevance being sufficient to represent a population of users are unlikely to hold.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2017:TAP, author = "Dongxiang Zhang and Long Guo and Liqiang Nie and Jie Shao and Sai Wu and Heng Tao Shen", title = "Targeted Advertising in Public Transportation Systems with Quantitative Evaluation", journal = j-TOIS, volume = "35", number = "3", pages = "20:1--20:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3003725", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In spite of vast business potential, targeted advertising in public transportation systems is a grossly unexplored research area. For instance, SBS Transit in Singapore can reach 1 billion passengers per year but the annual advertising revenue contributes less than \$35 million. To bridge the gap, we propose a probabilistic data model that captures the motion patterns and user interests so as to quantitatively evaluate the impact of an advertisement among the passengers. In particular, we leverage hundreds of millions of bus/train boarding transaction records to quantitatively estimate the probability as well as the extent of a user being influenced by an ad. Based on the influence model, we study a top-$k$ retrieval problem for bus/train ad recommendation, which acts as a primitive operator to support various advanced applications. We solve the retrieval problem efficiently to support real-time decision making. In the experimental study, we use the dataset from SBS Transit as a case study to verify the effectiveness and efficiency of our proposed methodologies.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Sadeghi:2017:RFB, author = "Seyedeh Sargol Sadeghi and Roi Blanco and Peter Mika and Mark Sanderson and Falk Scholer and David Vallet", title = "Re-Finding Behaviour in Vertical Domains", journal = j-TOIS, volume = "35", number = "3", pages = "21:1--21:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/2975590", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Re-finding is the process of searching for information that a user has previously encountered and is a common activity carried out with information retrieval systems. In this work, we investigate re-finding in the context of vertical search, differentiating and modeling user re-finding behavior within different media and topic domains, including images, news, reference material, and movies. We distinguish the re-finding behavior in vertical domains from re-finding in a general search context and engineer features that are effective in differentiating re-finding across the domains. The features are then used to build machine-learned models, achieving an accuracy of re-finding detection in verticals of 85.7\% on average. Our results demonstrate that detecting re-finding in specific verticals is more difficult than examining re-finding for general search tasks. We then investigate the effectiveness of differentiating re-finding behavior in two restricted contexts: We consider the case where the history of a searcher's interactions with the search system is not available. In this scenario, our features and models achieve an average accuracy of 77.5\% across the domains. We then examine the detection of re-finding during the early part of a search session. Both of these restrictions represent potential real-world search scenarios, where a system is attempting to learn about a user but may have limited information available. Finally, we investigate in which types of domains re-finding is most difficult. Here, it would appear that re-finding images is particularly challenging for users. This research has implications for search engine design, in terms of adapting search results by predicting the type of user tasks and potentially enabling the presentation of vertical-specific results when re-finding is identified. To the best of our knowledge, this is the first work to investigate the issue of vertical re-finding.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Konow:2017:IT, author = "Roberto Konow and Gonzalo Navarro and Charles L. A. Clarke and Alejandro L{\'o}pez-Ort{\'\i}z", title = "Inverted Treaps", journal = j-TOIS, volume = "35", number = "3", pages = "22:1--22:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3007186", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We introduce a new representation of the inverted index that performs faster ranked unions and intersections while using similar space. Our index is based on the treap data structure, which allows us to intersect/merge the document identifiers while simultaneously thresholding by frequency, instead of the costlier two-step classical processing methods. To achieve compression, we represent the treap topology using different alternative compact data structures. Further, the treap invariants allow us to elegantly encode differentially both document identifiers and frequencies. We also show how to extend this representation to support incremental updates over the index. Results show that, under the tf-idf scoring scheme, our index uses about the same space as state-of-the-art compact representations, while performing up to 2--20 times faster on ranked single-word, union, or intersection queries. Under the BM25 scoring scheme, our index may use up to 40\% more space than the others and outperforms them less frequently but still reaches improvement factors of 2--20 in the best cases. The index supporting incremental updates poses an overhead of 50\%--100\% over the static variants in terms of space, construction, and query time.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{White:2017:SRP, author = "Ryen W. White and Fernando Diaz and Qi Guo", title = "Search Result Prefetching on Desktop and Mobile", journal = j-TOIS, volume = "35", number = "3", pages = "23:1--23:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3015466", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Search result examination is an important part of searching. High page load latency for landing pages (clicked search results) can reduce the efficiency of the search process. Proactively prefetching landing pages in advance of clickthrough can save searchers valuable time. However, prefetching consumes resources (primarily bandwidth and battery) that are wasted unless the prefetched results are requested by searchers. Balancing the costs in prefetching particular results against the benefits in reduced latency to searchers represents the search result prefetching challenge. In this article, we introduce this challenge and present methods to address it in both desktop and mobile settings. Our methods leverage searchers' cursor movements (on desktop) and viewport-based viewing behavior (on mobile) on search engine result pages (SERPs) in real time to dynamically estimate the result that searchers will request next. We demonstrate through large-scale log analysis that our approach significantly outperforms three strong baselines that prefetch results based on (i) the search engine result ranking (prefetch top-ranked results), (ii) past SERP clicks from all searchers for the query (prefetch popular results), or (iii) past SERP clicks from the current searcher for the query (prefetch results that the searcher prefers). Our promising findings have implications for the design of search support in desktop and mobile settings that makes the search process more efficient.", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Moffat:2017:IUE, author = "Alistair Moffat and Peter Bailey and Falk Scholer and Paul Thomas", title = "Incorporating User Expectations and Behavior into the Measurement of Search Effectiveness", journal = j-TOIS, volume = "35", number = "3", pages = "24:1--24:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052768", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information retrieval systems aim to help users satisfy information needs. We argue that the goal of the person using the system, and the pattern of behavior that they exhibit as they proceed to attain that goal, should be incorporated into the methods and techniques used to evaluate the effectiveness of IR systems, so that the resulting effectiveness scores have a useful interpretation that corresponds to the users' search experience. In particular, we investigate the role of search task complexity, and show that it has a direct bearing on the number of relevant answer documents sought by users in response to an information need, suggesting that useful effectiveness metrics must be goal sensitive. We further suggest that user behavior while scanning results listings is affected by the rate at which their goal is being realized, and hence that appropriate effectiveness metrics must be adaptive to the presence (or not) of relevant documents in the ranking. In response to these two observations, we present a new effectiveness metric, INST, that has both of the desired properties: INST employs a parameter T, a direct measure of the user's search goal that adjusts the top-weightedness of the evaluation score; moreover, as progress towards the target T is made, the modeled user behavior is adapted, to reflect the remaining expectations. INST is experimentally compared to previous effectiveness metrics, including Average Precision (AP), Normalized Discounted Cumulative Gain (NDCG), and Rank-Biased Precision (RBP), demonstrating our claims as to INST's usefulness. Like RBP, INST is a weighted-precision metric, meaning that each score can be accompanied by a residual that quantifies the extent of the score uncertainty caused by unjudged documents. As part of our experimentation, we use crowd-sourced data and score residuals to demonstrate that a wide range of queries arise for even quite specific information needs, and that these variant queries introduce significant levels of residual uncertainty into typical experimental evaluations. These causes of variability have wide-reaching implications for experiment design, and for the construction of test collections.", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hu:2017:IQR, author = "Liang Hu and Longbing Cao and Jian Cao and Zhiping Gu and Guandong Xu and Jie Wang", title = "Improving the Quality of Recommendations for Users and Items in the Tail of Distribution", journal = j-TOIS, volume = "35", number = "3", pages = "25:1--25:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052769", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Short-head and long-tail distributed data are widely observed in the real world. The same is true of recommender systems (RSs), where a small number of popular items dominate the choices and feedback data while the rest only account for a small amount of feedback. As a result, most RS methods tend to learn user preferences from popular items since they account for most data. However, recent research in e-commerce and marketing has shown that future businesses will obtain greater profit from long-tail selling. Yet, although the number of long-tail items and users is much larger than that of short-head items and users, in reality, the amount of data associated with long-tail items and users is much less. As a result, user preferences tend to be popularity-biased. Furthermore, insufficient data makes long-tail items and users more vulnerable to shilling attack. To improve the quality of recommendations for items and users in the tail of distribution, we propose a coupled regularization approach that consists of two latent factor models: C-HMF, for enhancing credibility, and S-HMF, for emphasizing specialty on user choices. Specifically, the estimates learned from C-HMF and S-HMF recurrently serve as the empirical priors to regularize one another. Such coupled regularization leads to the comprehensive effects of final estimates, which produce more qualitative predictions for both tail users and tail items. To assess the effectiveness of our model, we conduct empirical evaluations on large real-world datasets with various metrics. The results prove that our approach significantly outperforms the compared methods.", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Huang:2017:ESK, author = "Minlie Huang and Qiao Qian and Xiaoyan Zhu", title = "Encoding Syntactic Knowledge in Neural Networks for Sentiment Classification", journal = j-TOIS, volume = "35", number = "3", pages = "26:1--26:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052770", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Phrase/Sentence representation is one of the most important problems in natural language processing. Many neural network models such as Convolutional Neural Network (CNN), Recursive Neural Network (RNN), and Long Short-Term Memory (LSTM) have been proposed to learn representations of phrase/sentence, however, rich syntactic knowledge has not been fully explored when composing a longer text from its shorter constituent words. In most traditional models, only word embeddings are utilized to compose phrase/sentence representations, while the syntactic information of words is yet to be explored. In this article, we discover that encoding syntactic knowledge (part-of-speech tag) in neural networks can enhance sentence/phrase representation. Specifically, we propose to learn tag-specific composition functions and tag embeddings in recursive neural networks, and propose to utilize POS tags to control the gates of tree-structured LSTM networks. We evaluate these models on two benchmark datasets for sentiment classification, and demonstrate that improvements can be obtained with such syntactic knowledge encoded.", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2017:CIJ, author = "Dongxiang Zhang and Liqiang Nie and Huanbo Luan and Kian-Lee Tan and Tat-Seng Chua and Heng Tao Shen", title = "Compact Indexing and Judicious Searching for Billion-Scale Microblog Retrieval", journal = j-TOIS, volume = "35", number = "3", pages = "27:1--27:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052771", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In this article, we study the problem of efficient top- k disjunctive query processing in a huge microblog dataset. In terms of compact indexing, we categorize the keywords into rare terms and common terms based on inverse document frequency (idf) and propose tailored block-oriented organization to save memory consumption. In terms of fast searching, we classify the queries into three types based on term category and judiciously design an efficient search algorithm for each type. We conducted extensive experiments on a billion-scale Twitter dataset and examined the performance with both simple and more advanced ranking functions. The results showed that with much smaller index size, our search algorithm achieves a factor of 2--3 times faster speedup over state-of-the-art solutions in both ranking scenarios.", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2017:PLQ, author = "Dongxiang Zhang and Yuchen Li and Ju Fan and Lianli Gao and Fumin Shen and Heng Tao Shen", title = "Processing Long Queries Against Short Text: Top-$k$ Advertisement Matching in News Stream Applications", journal = j-TOIS, volume = "35", number = "3", pages = "28:1--28:??", month = jun, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052772", ISSN = "1046-8188", ISSN-L = "0734-2047", bibdate = "Tue Jul 11 17:07:53 MDT 2017", bibsource = "http://www.acm.org/pubs/contents/journals/tois/; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Many real applications in real-time news stream advertising call for efficient processing of long queries against short text. In such applications, dynamic news feeds are regarded as queries to match against an advertisement (ad) database for retrieving the k most relevant ads. The existing approaches to keyword retrieval cannot work well in this search scenario when queries are triggered at a very high frequency. To address the problem, we introduce new techniques to significantly improve search performance. First, we devise a two-level partitioning for tight upper bound estimation and a lazy evaluation scheme to delay full evaluation of unpromising candidates, which can bring three to four times performance boosting in a database with 7 million ads. Second, we propose a novel rank-aware block-oriented inverted index to further improve performance. In this index scheme, each entry in an inverted list is assigned a rank according to its importance in the ad. Then, we introduce a block-at-a-time search strategy based on the index scheme to support a much tighter upper bound estimation and a very early termination. We have conducted experiments with real datasets, and the results show that the rank-aware method can further improve performance by an order of magnitude.", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2017:SMT, author = "Hongning Wang and Rui Li and Milad Shokouhi and Hang Li and Yi Chang", title = "Search, Mining, and Their Applications on Mobile Devices: Introduction to the Special Issue", journal = j-TOIS, volume = "35", number = "4", pages = "29:1--29:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086665", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In recent years, mobile devices have become the most popular interface for users to retrieve and access information: recent reports show that users spend significantly more time and issue more search queries on mobile devices than on desktops in the United States. The accelerated growth of mobile usage brings unique opportunities to the information retrieval and data mining research communities. Mobile devices capture rich contextual and personal signals that can be leveraged to accurately predict users' intent for serving more relevant content and can even proactively provide novel zero-query recommendations. Apple Siri, Google Now, and Microsoft Cortana are recent examples of such emerging systems. Furthermore, mobile devices constantly generate a huge amount of sensor footprints (e.g., GPS, motion sensors) and user activity data (e.g., used apps) that are often missing from their desktop counterparts. These new sources of implicit and explicit user feedback are valuable for discovering actionable knowledge, and designing better systems that serve each individual the right content at the right time and location. In addition, by aggregating mobile interactions across individuals, one can infer interesting conclusions beyond search and recommendation. Generating real-time traffic estimates is one example of such applications. This special issue focuses on research problems of search, mining, and their applications in mobile devices. Topics of interest in this special issue include but are not limited to mobile data mining and management, mobile search, personalization and recommendation, mobile user interfaces and human-computer interaction, and new applications in the mobile environment. The aim of this special issue is to bring together top experts across multiple disciplines, including information retrieval, data mining, mobile computing, and cyberphysical systems, such that academic and industrial researchers can exchange ideas and share the latest developments on the state of the art and practice of mobile search and mobile data mining.", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Sun:2017:CIP, author = "Yu Sun and Nicholas Jing Yuan and Xing Xie and Kieran McDonald and Rui Zhang", title = "Collaborative Intent Prediction with Real-Time Contextual Data", journal = j-TOIS, volume = "35", number = "4", pages = "30:1--30:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3041659", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Intelligent personal assistants on mobile devices such as Apple's Siri and Microsoft Cortana are increasingly important. Instead of passively reacting to queries, they provide users with brand new proactive experiences that aim to offer the right information at the right time. It is, therefore, crucial for personal assistants to understand users' intent, that is, what information users need now. Intent is closely related to context. Various contextual signals, including spatio-temporal information and users' activities, can signify users' intent. It is, however, challenging to model the correlation between intent and context. Intent and context are highly dynamic and often sequentially correlated. Contextual signals are usually sparse, heterogeneous, and not simultaneously available. We propose an innovative collaborative nowcasting model to jointly address all these issues. The model effectively addresses the complex sequential and concurring correlation between context and intent and recognizes users' real-time intent with continuously arrived contextual signals. We extensively evaluate the proposed model with real-world data sets from a commercial personal assistant. The results validate the effectiveness the proposed model, and demonstrate its capability of handling the real-time flow of contextual signals. The studied problem and model also provide inspiring implications for new paradigms of recommendation on mobile intelligent devices.", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Li:2017:TAP, author = "Xin Li and Mingming Jiang and Huiting Hong and Lejian Liao", title = "A Time-Aware Personalized Point-of-Interest Recommendation via High-Order Tensor Factorization", journal = j-TOIS, volume = "35", number = "4", pages = "31:1--31:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3057283", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, location-based services (LBSs) have been increasingly popular for people to experience new possibilities, for example, personalized point-of-interest (POI) recommendations that leverage on the overlapping of user trajectories to recommend POI collaboratively. POI recommendation is yet challenging as it suffers from the problems known for the conventional recommendation tasks such as data sparsity and cold start, and to a much greater extent. In the literature, most of the related works apply collaborate filtering to POI recommendation while overlooking the personalized time-variant human behavioral tendency. In this article, we put forward a fourth-order tensor factorization-based ranking methodology to recommend users their interested locations by considering their time-varying behavioral trends while capturing their long-term preferences and short-term preferences simultaneously. We also propose to categorize the locations to alleviate data sparsity and cold-start issues, and accordingly new POIs that users have not visited can thus be bubbled up during the category ranking process. The tensor factorization is carefully studied to prune the irrelevant factors to the ranking results to achieve efficient POI recommendations. The experimental results validate the efficacy of our proposed mechanism, which outperforms the state-of-the-art approaches significantly.", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{He:2017:MEB, author = "Jiangning He and Hongyan Liu", title = "Mining Exploratory Behavior to Improve Mobile App Recommendations", journal = j-TOIS, volume = "35", number = "4", pages = "32:1--32:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3072588", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the widespread usage of smart phones, more and more mobile apps are developed every day, playing an increasingly important role in changing our lifestyles and business models. In this trend, it becomes a hot research topic for developing effective mobile app recommender systems in both industry and academia. Compared with existing studies about mobile app recommendations, our research aims to improve the recommendation effectiveness based on analyzing a psychological trait of human beings, exploratory behavior, which refers to a type of variety-seeking behavior in unfamiliar domains. To this end, we propose a novel probabilistic model named Goal-oriented Exploratory Model (GEM), integrating exploratory behavior identification with personalized item recommendation. An algorithm combining collapsed Gibbs sampling and Expectation Maximization is developed for model learning and inference. Through extensive experiments conducted on a real dataset, the proposed model demonstrates superior recommendation performances and good interpretability compared with state-of-art recommendation methods. Moreover, empirical analyses on exploratory behavior find that individuals with a strong exploratory tendency exhibit behavioral patterns of variety seeking, risk taking, and higher involvement. Besides, mobile apps that are less popular or in the long tail possess greater potential of arousing exploratory behavior in individuals.", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bradesko:2017:CCM, author = "Luka Bradesko and Michael Witbrock and Janez Starc and Zala Herga and Marko Grobelnik and Dunja Mladeni{\'c}", title = "Curious Cat-Mobile, Context-Aware Conversational Crowdsourcing Knowledge Acquisition", journal = j-TOIS, volume = "35", number = "4", pages = "33:1--33:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086686", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Scaled acquisition of high-quality structured knowledge has been a longstanding goal of Artificial Intelligence research. Recent advances in crowdsourcing, the sheer number of Internet and mobile users, and the commercial availability of supporting platforms offer new tools for knowledge acquisition. This article applies context-aware knowledge acquisition that simultaneously satisfies users' immediate information needs while extending its own knowledge using crowdsourcing. The focus is on knowledge acquisition on a mobile device, which makes the approach practical and scalable; in this context, we propose and implement a new KA approach that exploits an existing knowledge base to drive the KA process, communicate with the right people, and check for consistency of the user-provided answers. We tested the viability of the approach in experiments using our platform with real users around the world, and an existing large source of common-sense background knowledge. These experiments show that the approach is promising: the knowledge is estimated to be true and useful for users 95\% of the time. Using context to proactively drive knowledge acquisition increased engagement and effectiveness (the number of new assertions/day/user increased for 175\%). Using pre-existing and newly acquired knowledge also proved beneficial.", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Umemoto:2017:SSU, author = "Kazutoshi Umemoto and Ruihua Song and Jian-Yun Nie and Xing Xie and Katsumi Tanaka and Yong Rui", title = "Search by Screenshots for Universal Article Clipping in Mobile Apps", journal = j-TOIS, volume = "35", number = "4", pages = "34:1--34:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3091107", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "To address the difficulty in clipping articles from various mobile applications (apps), we propose a novel framework called UniClip, which allows a user to snap a screen of an article to save the whole article in one place. The key task of the framework is search by screenshots, which has three challenges: (1) how to represent a screenshot; (2) how to formulate queries for effective article retrieval; and (3) how to identify the article from search results. We solve these by (1) segmenting a screenshot into structural units called blocks, (2) formulating effective search queries by considering the role of each block, and (3) aggregating the search result lists of multiple queries. To improve efficiency, we also extend our approach with learning-to-rank techniques so that we can find the desired article with only one query. Experimental results show that our approach achieves high retrieval performance ($ F_1 = 0.868$), which outperforms baselines based on keyword extraction and chunking methods. Learning-to-rank models improve our approach without learning by about 6\%. A user study conducted to investigate the usability of UniClip reveals that ours is preferred by 21 out of 22 participants for its simplicity and effectiveness.", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Dong:2017:UMD, author = "Yuxiao Dong and Nitesh V. Chawla and Jie Tang and Yang Yang and Yang Yang", title = "User Modeling on Demographic Attributes in Big Mobile Social Networks", journal = j-TOIS, volume = "35", number = "4", pages = "35:1--35:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3057278", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Users with demographic profiles in social networks offer the potential to understand the social principles that underpin our highly connected world, from individuals, to groups, to societies. In this article, we harness the power of network and data sciences to model the interplay between user demographics and social behavior and further study to what extent users' demographic profiles can be inferred from their mobile communication patterns. By modeling over 7 million users and 1 billion mobile communication records, we find that during the active dating period (i.e., 18--35 years old), users are active in broadening social connections with males and females alike, while after reaching 35 years of age people tend to keep small, closed, and same-gender social circles. Further, we formalize the demographic prediction problem of inferring users' gender and age simultaneously. We propose a factor graph-based WhoAmI method to address the problem by leveraging not only the correlations between network features and users' gender/age, but also the interrelations between gender and age. In addition, we identify a new problem-coupled network demographic prediction across multiple mobile operators-and present a coupled variant of the WhoAmI method to address its unique challenges. Our extensive experiments demonstrate the effectiveness, scalability, and applicability of the WhoAmI methods. Finally, our study finds a greater than 80\% potential predictability for inferring users' gender from phone call behavior and 73\% for users' age from text messaging interactions.", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yang:2017:NNA, author = "Cheng Yang and Maosong Sun and Wayne Xin Zhao and Zhiyuan Liu and Edward Y. Chang", title = "A Neural Network Approach to Jointly Modeling Social Networks and Mobile Trajectories", journal = j-TOIS, volume = "35", number = "4", pages = "36:1--36:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3041658", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Two characteristics of location-based services are mobile trajectories and the ability to facilitate social networking. The recording of trajectory data contributes valuable resources towards understanding users' geographical movement behaviors. Social networking is possible when users are able to quickly connect to anyone nearby. A social network with location based services is known as location-based social network (LBSN). As shown in Cho et al. [2013], locations that are frequently visited by socially related persons tend to be correlated, which indicates the close association between social connections and trajectory behaviors of users in LBSNs. To better analyze and mine LBSN data, we need to have a comprehensive view of each of these two aspects, i.e., the mobile trajectory data and the social network. Specifically, we present a novel neural network model that can jointly model both social networks and mobile trajectories. Our model consists of two components: the construction of social networks and the generation of mobile trajectories. First we adopt a network embedding method for the construction of social networks: a networking representation can be derived for a user. The key to our model lies in generating mobile trajectories. Second, we consider four factors that influence the generation process of mobile trajectories: user visit preference, influence of friends, short-term sequential contexts, and long-term sequential contexts. To characterize the last two contexts, we employ the RNN and GRU models to capture the sequential relatedness in mobile trajectories at the short or long term levels. Finally, the two components are tied by sharing the user network representations. Experimental results on two important applications demonstrate the effectiveness of our model. In particular, the improvement over baselines is more significant when either network structure or trajectory data is sparse.", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cao:2017:CPA, author = "Da Cao and Xiangnan He and Liqiang Nie and Xiaochi Wei and Xia Hu and Shunxiang Wu and Tat-Seng Chua", title = "Cross-Platform App Recommendation by Jointly Modeling Ratings and Texts", journal = j-TOIS, volume = "35", number = "4", pages = "37:1--37:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3017429", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Over the last decade, the renaissance of Web technologies has transformed the online world into an application (App) driven society. While the abundant Apps have provided great convenience, their sheer number also leads to severe information overload, making it difficult for users to identify desired Apps. To alleviate the information overloading issue, recommender systems have been proposed and deployed for the App domain. However, existing work on App recommendation has largely focused on one single platform (e.g., smartphones), while it ignores the rich data of other relevant platforms (e.g., tablets and computers). In this article, we tackle the problem of cross-platform App recommendation, aiming at leveraging users' and Apps' data on multiple platforms to enhance the recommendation accuracy. The key advantage of our proposal is that by leveraging multiplatform data, the perpetual issues in personalized recommender systems-data sparsity and cold-start-can be largely alleviated. To this end, we propose a hybrid solution, STAR (short for ``croSs-plaTform App Recommendation'') that integrates both numerical ratings and textual content from multiple platforms. In STAR, we innovatively represent an App as an aggregation of common features across platforms (e.g., App's functionalities) and specific features that are dependent on the resided platform. In light of this, STAR can discriminate a user's preference on an App by separating the user's interest into two parts (either in the App's inherent factors or platform-aware features). To evaluate our proposal, we construct two real-world datasets that are crawled from the App stores of iPhone, iPad, and iMac. Through extensive experiments, we show that our STAR method consistently outperforms highly competitive recommendation methods, justifying the rationality of our cross-platform App recommendation proposal and the effectiveness of our solution.", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yao:2017:VAR, author = "Yuan Yao and Wayne Xin Zhao and Yaojing Wang and Hanghang Tong and Feng Xu and Jian Lu", title = "Version-Aware Rating Prediction for Mobile App Recommendation", journal = j-TOIS, volume = "35", number = "4", pages = "38:1--38:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3015458", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the great popularity of mobile devices, the amount of mobile apps has grown at a more dramatic rate than ever expected. A technical challenge is how to recommend suitable apps to mobile users. In this work, we identify and focus on a unique characteristic that exists in mobile app recommendation-that is, an app usually corresponds to multiple release versions. Based on this characteristic, we propose a fine-grain version-aware app recommendation problem. Instead of directly learning the users' preferences over the apps, we aim to infer the ratings of users on a specific version of an app. However, the user-version rating matrix will be sparser than the corresponding user-app rating matrix, making existing recommendation methods less effective. In view of this, our approach has made two major extensions. First, we leverage the review text that is associated with each rating record; more importantly, we consider two types of version-based correlations. The first type is to capture the temporal correlations between multiple versions within the same app, and the second type of correlation is to capture the aggregation correlations between similar apps. Experimental results on a large dataset demonstrate the superiority of our approach over several competitive methods.", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2017:DUP, author = "Xuanzhe Liu and Wei Ai and Huoran Li and Jian Tang and Gang Huang and Feng Feng and Qiaozhu Mei", title = "Deriving User Preferences of Mobile Apps from Their Management Activities", journal = j-TOIS, volume = "35", number = "4", pages = "39:1--39:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3015462", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "App marketplaces host millions of mobile apps that are downloaded billions of times. Investigating how people manage mobile apps in their everyday lives creates a unique opportunity to understand the behavior and preferences of mobile device users, infer the quality of apps, and improve user experience. Existing literature provides very limited knowledge about app management activities, due to the lack of app usage data at scale. This article takes the initiative to analyze a very large app management log collected through a leading Android app marketplace. The dataset covers 5 months of detailed downloading, updating, and uninstallation activities, which involve 17 million anonymized users and 1 million apps. We present a surprising finding that the metrics commonly used to rank apps in app stores do not truly reflect the users' real attitudes. We then identify behavioral patterns from the app management activities that more accurately indicate user preferences of an app even when no explicit rating is available. A systematic statistical analysis is designed to evaluate machine learning models that are trained to predict user preferences using these behavioral patterns, which features an inverse probability weighting method to correct the selection biases in the training process.", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2017:CUT, author = "Senzhang Wang and Xiaoming Zhang and Jianping Cao and Lifang He and Leon Stenneth and Philip S. Yu and Zhoujun Li and Zhiqiu Huang", title = "Computing Urban Traffic Congestions by Incorporating Sparse {GPS} Probe Data and Social Media Data", journal = j-TOIS, volume = "35", number = "4", pages = "40:1--40:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3057281", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Estimating urban traffic conditions of an arterial network with GPS probe data is a practically important while substantially challenging problem, and has attracted increasing research interests recently. Although GPS probe data is becoming a ubiquitous data source for various traffic related applications currently, they are usually insufficient for fully estimating traffic conditions of a large arterial network due to the low sampling frequency. To explore other data sources for more effectively computing urban traffic conditions, we propose to collect various traffic events such as traffic accident and jam from social media as complementary information. In addition, to further explore other factors that might affect traffic conditions, we also extract rich auxiliary information including social events, road features, Point of Interest (POI), and weather. With the enriched traffic data and auxiliary information collected from different sources, we first study the traffic co-congestion pattern mining problem with the aim of discovering which road segments geographically close to each other are likely to co-occur traffic congestion. A search tree based approach is proposed to efficiently discover the co-congestion patterns. These patterns are then used to help estimate traffic congestions and detect anomalies in a transportation network. To fuse the multisourced data, we finally propose a coupled matrix and tensor factorization model named TCE\_R to more accurately complete the sparse traffic congestion matrix by collaboratively factorizing it with other matrices and tensors formed by other data. We evaluate the proposed model on the arterial network of downtown Chicago with 1,257 road segments whose total length is nearly 700 miles. The results demonstrate the superior performance of TCE\_R by comprehensive comparison with existing approaches.", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Song:2017:DLD, author = "Xuan Song and Ryosuke Shibasaki and Nicholos Jing Yuan and Xing Xie and Tao Li and Ryutaro Adachi", title = "{DeepMob}: Learning Deep Knowledge of Human Emergency Behavior and Mobility from Big and Heterogeneous Data", journal = j-TOIS, volume = "35", number = "4", pages = "41:1--41:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3057280", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The frequency and intensity of natural disasters has increased significantly in recent decades, and this trend is expected to continue. Hence, understanding and predicting human evacuation behavior and mobility will play a vital role in planning effective humanitarian relief, disaster management, and long-term societal reconstruction. However, existing models are shallow models, and it is difficult to apply them for understanding the ``deep knowledge'' of human mobility. Therefore, in this study, we collect big and heterogeneous data (e.g., GPS records of 1.6 million users over 3 years, data on earthquakes that have occurred in Japan over 4 years, news report data, and transportation network data), and we build an intelligent system, namely, DeepMob, for understanding and predicting human evacuation behavior and mobility following different types of natural disasters. The key component of DeepMob is based on a deep learning architecture that aims to understand the basic laws that govern human behavior and mobility following natural disasters, from big and heterogeneous data. Furthermore, based on the deep learning model, DeepMob can accurately predict or simulate a person's future evacuation behaviors or evacuation routes under different disaster conditions. Experimental results and validations demonstrate the efficiency and superior performance of our system, and suggest that human mobility following disasters may be predicted and simulated more easily than previously thought.", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Farseev:2017:TCF, author = "Aleksandr Farseev and Tat-Seng Chua", title = "Tweet Can Be Fit: Integrating Data from Wearable Sensors and Multiple Social Networks for Wellness Profile Learning", journal = j-TOIS, volume = "35", number = "4", pages = "42:1--42:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086676", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Wellness is a widely popular concept that is commonly applied to fitness and self-help products or services. Inference of personal wellness--related attributes, such as body mass index (BMI) category or disease tendency, as well as understanding of global dependencies between wellness attributes and users' behavior, is of crucial importance to various applications in personal and public wellness domains. At the same time, the emergence of social media platforms and wearable sensors makes it feasible to perform wellness profiling for users from multiple perspectives. However, research efforts on wellness profiling and integration of social media and sensor data are relatively sparse. This study represents one of the first attempts in this direction. Specifically, we infer personal wellness attributes by utilizing our proposed multisource multitask wellness profile learning framework-WellMTL-which can handle data incompleteness and perform wellness attributes inference from sensor and social media data simultaneously. To gain insights into the data at a global level, we also examine correlations between first-order data representations and personal wellness attributes. Our experimental results show that the integration of sensor data and multiple social media sources can substantially boost the performance of individual wellness profiling.", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2017:UPP, author = "Haoyu Wang and Yuanchun Li and Yao Guo and Yuvraj Agarwal and Jason I. Hong", title = "Understanding the Purpose of Permission Use in Mobile Apps", journal = j-TOIS, volume = "35", number = "4", pages = "43:1--43:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086677", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:46 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Mobile apps frequently request access to sensitive data, such as location and contacts. Understanding the purpose of why sensitive data is accessed could help improve privacy as well as enable new kinds of access control. In this article, we propose a text mining based method to infer the purpose of sensitive data access by Android apps. The key idea we propose is to extract multiple features from app code and then use those features to train a machine learning classifier for purpose inference. We present the design, implementation, and evaluation of two complementary approaches to infer the purpose of permission use, first using purely static analysis, and then using primarily dynamic analysis. We also discuss the pros and cons of both approaches and the trade-offs involved.", acknowledgement = ack-nhfb, articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Alkwai:2017:CAR, author = "Lulwah M. Alkwai and Michael L. Nelson and Michele C. Weigle", title = "Comparing the Archival Rate of {Arabic}, {English}, {Danish}, and {Korean} Language {Web} Pages", journal = j-TOIS, volume = "36", number = "1", pages = "1:1--1:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3041656", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "It has long been suspected that web archives and search engines favor Western and English language webpages. In this article, we quantitatively explore how well indexed and archived Arabic language webpages are as compared to those from other languages. We began by sampling 15,092 unique URIs from three different website directories: DMOZ (multilingual), Raddadi, and Star28 (the last two primarily Arabic language). Using language identification tools, we eliminated pages not in the Arabic language (e.g., English-language versions of Aljazeera pages) and culled the collection to 7,976 Arabic language webpages. We then used these 7,976 pages and crawled the live web and web archives to produce a collection of 300,646 Arabic language pages. We compared the analysis of Arabic language pages with that of English, Danish, and Korean language pages. First, for each language, we sampled unique URIs from DMOZ; then, using language identification tools, we kept only pages in the desired language. Finally, we crawled the archived and live web to collect a larger sample of pages in English, Danish, or Korean. In total for the four languages, we analyzed over 500,000 webpages. We discovered: (1) English has a higher archiving rate than Arabic, with 72.04\% archived. However, Arabic has a higher archiving rate than Danish and Korean, with 53.36\% of Arabic URIs archived, followed by Danish and Korean with 35.89\% and 32.81\% archived, respectively. (2) Most Arabic and English language pages are located in the United States; only 14.84\% of the Arabic URIs had an Arabic country code top-level domain (e.g., sa) and only 10.53\% had a GeoIP in an Arabic country. Most Danish-language pages were located in Denmark, and most Korean-language pages were located in South Korea. (3) The presence of a webpage in a directory positively impacts indexing and presence in the DMOZ directory, specifically, positively impacts archiving in all four languages. In this work, we show that web archives and search engines favor English pages. However, it is not universally true for all Western-language webpages because, in this work, we show that Arabic webpages have a higher archival rate than Danish language webpages.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pibiri:2017:CEF, author = "Giulio Ermanno Pibiri and Rossano Venturini", title = "Clustered {Elias--Fano} Indexes", journal = j-TOIS, volume = "36", number = "1", pages = "2:1--2:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052773", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "State-of-the-art encoders for inverted indexes compress each posting list individually. Encoding clusters of posting lists offers the possibility of reducing the redundancy of the lists while maintaining a noticeable query processing speed. In this article, we propose a new index representation based on clustering the collection of posting lists and, for each created cluster, building an ad hoc reference list with respect to which all lists in the cluster are encoded with Elias-Fano. We describe a posting lists clustering algorithm tailored for our encoder and two methods for building the reference list for a cluster. Both approaches are heuristic and differ in the way postings are added to the reference list: according to their frequency in the cluster or according to the number of bits necessary for their representation. The extensive experimental analysis indicates that significant space reductions are indeed possible, beating the best state-of-the-art encoders.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Jiang:2017:GGS, author = "Jiawei Jiang and Yunhai Tong and Hua Lu and Bin Cui and Kai Lei and Lele Yu", title = "{GVoS}: a General System for Near-Duplicate Video-Related Applications on Storm", journal = j-TOIS, volume = "36", number = "1", pages = "3:1--3:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3041657", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The exponential increase of online videos greatly enriches the life of users but also brings huge numbers of near-duplicate videos (NDVs) that seriously challenge the video websites. The video websites entail NDV-related applications such as detection of copyright violation, video monitoring, video re-ranking, and video recommendation. Since these applications adopt different features and different processing procedures due to diverse scenarios, constructing separate and special-purpose systems for them incurs considerable costs on design, implementation, and maintenance. In this article, we propose a general NDV system on Storm (GVoS)-a popular distributed real-time stream processing platform-to simultaneously support a wide variety of video applications. The generality of GVoS is achieved in two aspects. First, we extract the reusable components from various applications. Second, we conduct the communication between components via a mechanism called Stream Shared Message (SSM) that contains the video-related data. Furthermore, we present an algorithm to reduce the size of SSM in order to avoid the data explosion and decrease the network latency. The experimental results demonstrate that GVoS can achieve performance almost the same as the customized systems. Meanwhile, GVoS accomplishes remarkably higher systematic versatility and efficiently facilitates the development of various NDV-related applications.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2017:UVP, author = "Xiang Wang and Liqiang Nie and Xuemeng Song and Dongxiang Zhang and Tat-Seng Chua", title = "Unifying Virtual and Physical Worlds: Learning Toward Local and Global Consistency", journal = j-TOIS, volume = "36", number = "1", pages = "4:1--4:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052774", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Event-based social networking services, such as Meetup, are capable of linking online virtual interactions to offline physical activities. Compared to mono online social networking services (e.g., Twitter and Google+), such dual networks provide a complete picture of users' online and offline behaviors that more often than not are compatible and complementary. In the light of this, we argue that joint learning over dual networks offers us a better way to comprehensively understand user behaviors and their underlying organizational principles. Despite its value, few efforts have been dedicated to jointly considering the following factors within a unified model: (1) local user contextualization, (2) global structure coherence, and (3) effectiveness evaluation. Toward this end, we propose a novel dual clustering model for community detection over dual networks to jointly model local consistency for a specific user and global consistency of partitioning results across networks. We theoretically derived its solution. In addition, we verified our model regarding multiple metrics from different aspects and applied it to the application of event attendance prediction.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Shirakawa:2017:IWG, author = "Masumi Shirakawa and Takahiro Hara and Shojiro Nishio", title = "{IDF} for Word {$N$}-grams", journal = j-TOIS, volume = "36", number = "1", pages = "5:1--5:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3052775", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Inverse Document Frequency (IDF) is widely accepted term weighting scheme whose robustness is supported by many theoretical justifications. However, applying IDF to word N-grams (or simply N-grams) of any length without relying on heuristics has remained a challenging issue. This article describes a theoretical extension of IDF to handle N-grams. First, we elucidate the theoretical relationship between IDF and information distance, a universal metric defined by the Kolmogorov complexity. Based on our understanding of this relationship, we propose N-gram IDF, a new IDF family that gives fair weights to words and phrases of any length. Based only on the magnitude relation of N-gram IDF weights, dominant N-grams among overlapping N-grams can be determined. We also propose an efficient method to compute the N-gram IDF weights of all N-grams by leveraging the enhanced suffix array and wavelet tree. Because the exact computation of N-gram IDF provably requires significant computational cost, we modify it to a fast approximation method that can estimate weight errors analytically and maintain application-level performance. Empirical evaluations with unsupervised/supervised key term extraction and web search query segmentation with various experimental settings demonstrate the robustness and language-independent nature of the proposed N-gram IDF.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Vardasbi:2017:SSW, author = "Ali Vardasbi and Heshaam Faili and Masoud Asadpour", title = "{SWIM}: Stepped Weighted Shell Decomposition Influence Maximization for Large-Scale Networks", journal = j-TOIS, volume = "36", number = "1", pages = "6:1--6:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3072652", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A considerable amount of research has been devoted to the proposition of scalable algorithms for influence maximization. A number of such scalable algorithms exploit the community structure of the network. Besides the community structure, real-world social networks possess a different property, known as the layer structure. In this article, we propose a method based on the layer structure to maximize the influence in huge networks. Conducting experiments on a number of real-world networks, we will show that our method outperforms the state-of-the-art algorithms by its time complexity while having similar or slightly better final influence spread. Furthermore, unlike its predecessors, our method is able to show a high entanglement between structure and dynamics by giving insight on the reason why different networks have two contrasting behaviors in their saturation. By ``saturation,'' we mean a state during the seed selection process after which adjoining new nodes to the initial set will have a negligible effect on increasing the influence spread. We will demonstrate that how our method can predict the saturation dynamics in the networks. This prediction can be used to identify the network structures that are more vulnerable to the fast spread of the rumors.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yang:2017:YMP, author = "Longqi Yang and Cheng-Kang Hsieh and Hongjian Yang and John P. Pollak and Nicola Dell and Serge Belongie and Curtis Cole and Deborah Estrin", title = "{Yum-Me}: a Personalized Nutrient-Based Meal Recommender System", journal = j-TOIS, volume = "36", number = "1", pages = "7:1--7:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3072614", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Nutrient-based meal recommendations have the potential to help individuals prevent or manage conditions such as diabetes and obesity. However, learning people's food preferences and making recommendations that simultaneously appeal to their palate and satisfy nutritional expectations are challenging. Existing approaches either only learn high-level preferences or require a prolonged learning period. We propose Yum-me, a personalized nutrient-based meal recommender system designed to meet individuals' nutritional expectations, dietary restrictions, and fine-grained food preferences. Yum-me enables a simple and accurate food preference profiling procedure via a visual quiz-based user interface and projects the learned profile into the domain of nutritionally appropriate food options to find ones that will appeal to the user. We present the design and implementation of Yum-me and further describe and evaluate two innovative contributions. The first contribution is an open source state-of-the-art food image analysis model, named FoodDist. We demonstrate FoodDist's superior performance through careful benchmarking and discuss its applicability across a wide array of dietary applications. The second contribution is a novel online learning framework that learns food preference from itemwise and pairwise image comparisons. We evaluate the framework in a field study of 227 anonymous users and demonstrate that it outperforms other baselines by a significant margin. We further conducted an end-to-end validation of the feasibility and effectiveness of Yum-me through a 60-person user study, in which Yum-me improves the recommendation acceptance rate by 42.63\%.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liang:2017:SRD, author = "Shangsong Liang and Emine Yilmaz and Hong Shen and Maarten {De Rijke} and W. Bruce Croft", title = "Search Result Diversification in Short Text Streams", journal = j-TOIS, volume = "36", number = "1", pages = "8:1--8:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3057282", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We consider the problem of search result diversification for streams of short texts. Diversifying search results in short text streams is more challenging than in the case of long documents, as it is difficult to capture the latent topics of short documents. To capture the changes of topics and the probabilities of documents for a given query at a specific time in a short text stream, we propose a dynamic Dirichlet multinomial mixture topic model, called D2M3, as well as a Gibbs sampling algorithm for the inference. We also propose a streaming diversification algorithm, SDA, that integrates the information captured by D2M3 with our proposed modified version of the PM-2 (Proportionality-based diversification Method --- second version) diversification algorithm. We conduct experiments on a Twitter dataset and find that SDA statistically significantly outperforms state-of-the-art non-streaming retrieval methods, plain streaming retrieval methods, as well as streaming diversification methods that use other dynamic topic models.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Hou:2017:LAC, author = "Lei Hou and Juanzi Li and Xiao-Li Li and Jie Tang and Xiaofei Guo", title = "Learning to Align Comments to News Topics", journal = j-TOIS, volume = "36", number = "1", pages = "9:1--9:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3072591", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the rapid proliferation of social media, increasingly more people express their opinions and reviews (user-generated content (UGC)) on recent news articles through various online services, such as news portals, forums, discussion groups, and microblogs. Clearly, identifying hot topics that users greatly care about can improve readers' news browsing experience and facilitate research into interaction analysis between news and UGC. Furthermore, it is of great benefit to public opinion monitoring and management for both industry and government agencies. However, it is extremely time consuming, if not impossible, to manually examine the large amount of available social content. In this article, we formally define the news comment alignment problem and propose a novel framework that: (1) automatically extracts topics from a given news article and its associated comments, (2) identifies and extends positive examples with different degrees of confidence using three methods (i.e., hypersphere, density, and cluster chain), and (3) completes the alignment between news sentences and comments through a weighted-SVM classifier. Extensive experiments show that our proposed framework significantly outperforms state-of-the-art methods.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liang:2017:IDU, author = "Shangsong Liang and Zhaochun Ren and Yukun Zhao and Jun Ma and Emine Yilmaz and Maarten {De Rijke}", title = "Inferring Dynamic User Interests in Streams of Short Texts for User Clustering", journal = j-TOIS, volume = "36", number = "1", pages = "10:1--10:??", month = aug, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3072606", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "User clustering has been studied from different angles. In order to identify shared interests, behavior-based methods consider similar browsing or search patterns of users, whereas content-based methods use information from the contents of the documents visited by the users. So far, content-based user clustering has mostly focused on static sets of relatively long documents. Given the dynamic nature of social media, there is a need to dynamically cluster users in the context of streams of short texts. User clustering in this setting is more challenging than in the case of long documents, as it is difficult to capture the users' dynamic topic distributions in sparse data settings. To address this problem, we propose a dynamic user clustering topic model (UCT). UCT adaptively tracks changes of each user's time-varying topic distributions based both on the short texts the user posts during a given time period and on previously estimated distributions. To infer changes, we propose a Gibbs sampling algorithm where a set of word pairs from each user is constructed for sampling. UCT can be used in two ways: (1) as a short-term dependency model that infers a user's current topic distribution based on the user's topic distributions during the previous time period only, and (2) as a long-term dependency model that infers a user's current topic distributions based on the user's topic distributions during multiple time periods in the past. The clustering results are explainable and human-understandable, in contrast to many other clustering algorithms. For evaluation purposes, we work with a dataset consisting of users and tweets from each user. Experimental results demonstrate the effectiveness of our proposed short-term and long-term dependency user clustering models compared to state-of-the-art baselines.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Li:2017:ETM, author = "Chenliang Li and Yu Duan and Haoran Wang and Zhiqian Zhang and Aixin Sun and Zongyang Ma", title = "Enhancing Topic Modeling for Short Texts with Auxiliary Word Embeddings", journal = j-TOIS, volume = "36", number = "2", pages = "11:1--11:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3091108", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Many applications require semantic understanding of short texts, and inferring discriminative and coherent latent topics is a critical and fundamental task in these applications. Conventional topic models largely rely on word co-occurrences to derive topics from a collection of documents. However, due to the length of each document, short texts are much more sparse in terms of word co-occurrences. Recent studies show that the Dirichlet Multinomial Mixture (DMM) model is effective for topic inference over short texts by assuming that each piece of short text is generated by a single topic. However, DMM has two main limitations. First, even though it seems reasonable to assume that each short text has only one topic because of its shortness, the definition of ``shortness'' is subjective and the length of the short texts is dataset dependent. That is, the single-topic assumption may be too strong for some datasets. To address this limitation, we propose to model the topic number as a Poisson distribution, allowing each short text to be associated with a small number of topics (e.g., one to three topics). This model is named PDMM. Second, DMM (and also PDMM) does not have access to background knowledge (e.g., semantic relations between words) when modeling short texts. When a human being interprets a piece of short text, the understanding is not solely based on its content words, but also their semantic relations. Recent advances in word embeddings offer effective learning of word semantic relations from a large corpus. Such auxiliary word embeddings enable us to address the second limitation. To this end, we propose to promote the semantically related words under the same topic during the sampling process, by using the generalized P{\'o}lya urn (GPU) model. Through the GPU model, background knowledge about word semantic relations learned from millions of external documents can be easily exploited to improve topic modeling for short texts. By directly extending the PDMM model with the GPU model, we propose two more effective topic models for short texts, named GPU-DMM and GPU-PDMM. Through extensive experiments on two real-world short text collections in two languages, we demonstrate that PDMM achieves better topic representations than state-of-the-art models, measured by topic coherence. The learned topic representation leads to better accuracy in a text classification task, as an indirect evaluation. Both GPU-DMM and GPU-PDMM further improve topic coherence and text classification accuracy. GPU-PDMM outperforms GPU-DMM at the price of higher computational costs.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Voorhees:2017:URI, author = "Ellen M. Voorhees and Daniel Samarov and Ian Soboroff", title = "Using Replicates in Information Retrieval Evaluation", journal = j-TOIS, volume = "36", number = "2", pages = "12:1--12:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086701", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article explores a method for more accurately estimating the main effect of the system in a typical test-collection-based evaluation of information retrieval systems, thus increasing the sensitivity of system comparisons. Randomly partitioning the test document collection allows for multiple tests of a given system and topic (replicates). Bootstrap ANOVA can use these replicates to extract system-topic interactions-something not possible without replicates-yielding a more precise value for the system effect and a narrower confidence interval around that value. Experiments using multiple TREC collections demonstrate that removing the topic-system interactions substantially reduces the confidence intervals around the system effect as well as increases the number of significant pairwise differences found. Further, the method is robust against small changes in the number of partitions used, against variability in the documents that constitute the partitions, and the measure of effectiveness used to quantify system effectiveness.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2017:FFT, author = "Jing Zhang and Jie Tang and Cong Ma and Hanghang Tong and Yu Jing and Juanzi Li and Walter Luyten and Marie-Francine Moens", title = "Fast and Flexible Top-$k$ Similarity Search on Large Networks", journal = j-TOIS, volume = "36", number = "2", pages = "13:1--13:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086695", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Similarity search is a fundamental problem in network analysis and can be applied in many applications, such as collaborator recommendation in coauthor networks, friend recommendation in social networks, and relation prediction in medical information networks. In this article, we propose a sampling-based method using random paths to estimate the similarities based on both common neighbors and structural contexts efficiently in very large homogeneous or heterogeneous information networks. We give a theoretical guarantee that the sampling size depends on the error-bound $ \epsilon $, the confidence level $ (1 - \delta) $, and the path length $T$ of each random walk. We perform an extensive empirical study on a Tencent microblogging network of 1,000,000,000 edges. We show that our algorithm can return top-$k$ similar vertices for any vertex in a network $ 300 \times $ faster than the state-of-the-art methods. We develop a prototype system of recommending similar authors to demonstrate the effectiveness of our method.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nguyen:2017:SIS, author = "Hung T. Nguyen and Preetam Ghosh and Michael L. Mayo and Thang N. Dinh", title = "Social Influence Spectrum at Scale: Near-Optimal Solutions for Multiple Budgets at Once", journal = j-TOIS, volume = "36", number = "2", pages = "14:1--14:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086700", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Given a social network, the Influence Maximization (InfMax) problem seeks a seed set of $k$ people that maximizes the expected influence for a viral marketing campaign. However, a solution for a particular seed size $k$ is often not enough to make an informed choice regarding budget and cost-effectiveness. In this article, we propose the computation of Influence Spectrum (InfSpec), the maximum influence at each possible seed set size $k$ within a given range $ [k_{\rm lower}, k_{\rm upper}]$, thus providing optimal decision making for any availability of budget or influence requirements. As none of the existing methods for InfMax are efficient enough for the task in large networks, we propose LISA (sub-Linear Influence Spectrum Approximation), an efficient approximation algorithm for InfSpec (and also InfMax) with the best-known worst-case guarantees for billion-scale networks. LISA returns an $ (1 - 1 / e - \epsilon)$-approximate influence spectrum with high probability $ (1 - \delta)$, where $ \epsilon $, $ \delta $ are precision parameters provided by users. Using statistical decision theory, LISA has an asymptotic optimal running time (in addition to optimal approximation guarantee). In practice, LISA surpasses the state-of-the-art InfMax methods, taking less than 15 minutes to process a network of 41.7 million nodes and 1.5 billions edges.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cai:2017:ALC, author = "Wenbin Cai and Yexun Zhang and Ya Zhang and Siyuan Zhou and Wenquan Wang and Zhuoxiang Chen and Chris Ding", title = "Active Learning for Classification with Maximum Model Change", journal = j-TOIS, volume = "36", number = "2", pages = "15:1--15:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086820", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Most existing active learning studies focus on designing sample selection algorithms. However, several fundamental problems deserve investigation to provide deep insight into active learning. In this article, we conduct an in-depth investigation on active learning for classification from the perspective of model change. We derive a general active learning framework for classification called maximum model change (MMC), which aims at querying the influential examples. The model change is quantified as the difference between the model parameters before and after training with the expanded training set. Inspired by the stochastic gradient update rule, the gradient of the loss with respect to a given candidate example is adopted to approximate the model change. This framework is applied to two popular classifiers: support vector machines and logistic regression. We analyze the convergence property of MMC and theoretically justify it. We explore the connection between MMC and uncertainty-based sampling to provide a uniform view. In addition, we discuss its potential usability to other learning models and show its applicability in a wide range of applications. We validate the MMC strategy on two kinds of benchmark datasets, the UCI repository and ImageNet, and show that it outperforms many state-of-the-art methods.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2017:DBE, author = "Ming Liu and Lei Chen and Bingquan Liu and Guidong Zheng and Xiaoming Zhang", title = "{DBpedia}-Based Entity Linking via Greedy Search and Adjusted {Monte Carlo} Random Walk", journal = j-TOIS, volume = "36", number = "2", pages = "16:1--16:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086703", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Facing a large amount of entities appearing on the web, entity linking has recently become useful. It assigns an entity from a resource to one name mention to help users grasp the meaning of this name mention. Unfortunately, many possible entities can be assigned to one name mention. Apparently, the usually co-occurring name mentions are related and can be considered together to determine their best assignments. This approach is called collective entity linking and is often conducted based on entity graph. However, traditional collective entity linking methods either consume much time due to the large scale of entity graph or obtain low accuracy due to simplifying graph. To improve both accuracy and efficiency, this article proposes a novel collective entity linking algorithm. It first constructs an entity graph by connecting any two related entities, and then a probability-based objective function is proposed on this graph to ensure the high accuracy of the linking result. Via this function, we convert entity linking to the process of finding the nodes with the highest PageRank Values. Greedy search and an adjusted Monte Carlo random walk are proposed to fulfill this work. Experimental results demonstrate that our algorithm performs much better than traditional linking methods.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Peng:2017:PMT, author = "Min Peng and Wang Gao and Hua Wang and Yanchun Zhang and Jiajia Huang and Qianqian Xie and Gang Hu and Gang Tian", title = "Parallelization of Massive Textstream Compression Based on Compressed Sensing", journal = j-TOIS, volume = "36", number = "2", pages = "17:1--17:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3086702", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/datacompression.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Compressing textstreams generated by social networks can both reduce storage consumption and improve efficiency such as fast searching. However, the compression process is a challenge due to the large scale of textstreams. In this article, we propose a textstream compression framework based on compressed sensing theory and design a series of matching parallel procedures. The new approach uses a linear projection technique in the textstream compression process, achieving fast compression speed and low compression ratio. Two processes are executed by designing elaborated parallel procedures for efficient compressing and decompressing of large-scale textstreams. The decompression process is implemented for approximate solutions of underdetermined linear systems. Experimental results show that the new method can efficiently achieve the compression and decompression tasks on a large amount of text generated by social networks.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhou:2017:MMD, author = "Guang-You Zhou and Jimmy Xiangji Huang", title = "Modeling and Mining Domain Shared Knowledge for Sentiment Analysis", journal = j-TOIS, volume = "36", number = "2", pages = "18:1--18:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3091995", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Sentiment classification aims to automatically predict sentiment polarity (e.g., positive or negative) of user generated sentiment data (e.g., reviews, blogs). In real applications, these user-generated sentiment data can span so many different domains that it is difficult to label the training data for all of them. Therefore, we study the problem of sentiment classification adaptation task in this article. That is, a system is trained to label reviews from one source domain but is meant to be used on the target domain. One of the biggest challenges for sentiment classification adaptation task is how to deal with the problem when two data distributions between the source domain and target domain are significantly different from one another. However, our observation is that there might exist some domain shared knowledge among certain input dimensions of different domains. In this article, we present a novel method for modeling and mining the domain shared knowledge from different sentiment review domains via a joint non-negative matrix factorization-based framework. In this proposed framework, we attempt to learn the domain shared knowledge and the domain-specific information from different sentiment review domains with several various regularization constraints. The advantage of the proposed method can promote the correspondence under the topic space between the source domain and the target domain, which can significantly reduce the data distribution gap across two domains. We conduct extensive experiments on two real-world balanced data sets from Amazon product reviews for sentence-level and document-level binary sentiment classification. Experimental results show that our proposed approach significantly outperforms several strong baselines and achieves an accuracy that is competitive with the most well-known methods for sentiment classification adaptation.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ferro:2017:WDA, author = "Nicola Ferro", title = "What Does Affect the Correlation Among Evaluation Measures?", journal = j-TOIS, volume = "36", number = "2", pages = "19:1--19:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3106371", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information Retrieval (IR) is well-known for the great number of adopted evaluation measures, with new ones popping up more and more frequently. In this context, correlation analysis is the tool used to study the evaluation measures and to let us understand if two measures rank systems similarly, if they grasp different aspects of system performances or actually reflect different user models, if a new measure is well motivated or not. To this end, the two most commonly used correlation coefficients are the Kendall's $ \tau $ correlation and the AP correlation $ \tau_{\rm AP} $. The goal of the article is to investigate the properties of the tool, that is, correlation analysis, we use to study evaluation measures. In particular, we investigate three research questions about these two correlation coefficients: (i) what is the effect of the number of systems and topics? (ii) what is the effect of removing low-performing systems? (iii) what is the effect of the experimental collections? To answer these research questions, we propose a methodology based on General Linear Mixed Model (GLMM) and ANalysis Of VAriance (ANOVA) to isolate the effects of the number of topics, number of systems, and experimental collections and to let us observe expected correlation values, net from these effects, which are stable and reliable. We learned that the effect of the number of topics is more prominent than the effect of the number of systems. Even if it produces different absolute values, the effect of removing low-performing systems does not seem to provide information substantially different from not removing them, especially when comparing a whole set of evaluation measures. Finally, we found out that both document corpora and topic sets affect the correlation among evaluation measures, the effect of the latter being more prominent. Moreover, there is a substantial interaction between evaluation measures, corpora and topic sets, meaning that the correlation between different evaluation measures can be substantially increased or decreased depending on the different corpora and topics at hand.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ferrante:2017:AEE, author = "Marco Ferrante and Nicola Ferro and Maria Maistro", title = "{AWARE}: Exploiting Evaluation Measures to Combine Multiple Assessors", journal = j-TOIS, volume = "36", number = "2", pages = "20:1--20:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3110217", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We propose the Assessor-driven Weighted Averages for Retrieval Evaluation (AWARE) probabilistic framework, a novel methodology for dealing with multiple crowd assessors that may be contradictory and/or noisy. By modeling relevance judgements and crowd assessors as sources of uncertainty, AWARE takes the expectation of a generic performance measure, like Average Precision, composed with these random variables. In this way, it approaches the problem of aggregating different crowd assessors from a new perspective, that is, directly combining the performance measures computed on the ground truth generated by the crowd assessors instead of adopting some classification technique to merge the labels produced by them. We propose several unsupervised estimators that instantiate the AWARE framework and we compare them with state-of-the-art approaches, that is,Majoriity Vote and Expectation Maximization, on TREC collections. We found that AWARE approaches improve in terms of their capability of correctly ranking systems and predicting their actual performance scores.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bai:2017:ULI, author = "Xiao Bai and Ioannis Arapakis and B. Barla Cambazoglu and Ana Freire", title = "Understanding and Leveraging the Impact of Response Latency on User Behaviour in {Web} Search", journal = j-TOIS, volume = "36", number = "2", pages = "21:1--21:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3106372", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The interplay between the response latency of web search systems and users' search experience has only recently started to attract research attention, despite the important implications of response latency on monetisation of such systems. In this work, we carry out two complementary studies to investigate the impact of response latency on users' searching behaviour in web search engines. We first conduct a controlled user study to investigate the sensitivity of users to increasing delays in response latency. This study shows that the users of a fast search system are more sensitive to delays than the users of a slow search system. Moreover, the study finds that users are more likely to notice the response latency delays beyond a certain latency threshold, their search experience potentially being affected. We then analyse a large number of search queries obtained from Yahoo Web Search to investigate the impact of response latency on users' click behaviour. This analysis demonstrates the significant change in click behaviour as the response latency increases. We also find that certain user, context, and query attributes play a role in the way increasing response latency affects the click behaviour. To demonstrate a possible use case for our findings, we devise a machine-learning framework that leverages the latency impact, together with other features, to predict whether a user will issue any clicks on web search results. As a further extension of this use case, we investigate whether this machine-learning framework can be exploited to help search engines reduce their energy consumption during query processing.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Shi:2017:LRB, author = "Lei Shi and Wayne Xin Zhao and Yi-Dong Shen", title = "Local Representative-Based Matrix Factorization for Cold-Start Recommendation", journal = j-TOIS, volume = "36", number = "2", pages = "22:1--22:??", month = sep, year = "2017", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3108148", ISSN = "1046-8188", bibdate = "Tue Jan 16 07:16:47 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Cold-start recommendation is one of the most challenging problems in recommender systems. An important approach to cold-start recommendation is to conduct an interview for new users, called the interview-based approach. Among the interview-based methods, Representative-Based Matrix Factorization (RBMF) [24] provides an effective solution with appealing merits: it represents users over selected representative items, which makes the recommendations highly intuitive and interpretable. However, RBMF only utilizes a global set of representative items to model all users. Such a representation is somehow too strict and may not be flexible enough to capture varying users' interests. To address this problem, we propose a novel interview-based model to dynamically create meaningful user groups using decision trees and then select local representative items for different groups. A two-round interview is performed for a new user. In the first round, $ l_1 $ global questions are issued for group division, while in the second round, $ l_2 $ local-group-specific questions are given to derive local representation. We collect the feedback on the $ (l_1 + l_2) $ items to learn the user representations. By putting these steps together, we develop a joint optimization model, named local representative-based matrix factorization, for new user recommendations. Extensive experiments on three public datasets have demonstrated the effectiveness of the proposed model compared with several competitive baselines.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Arampatzis:2018:SPI, author = "Avi Arampatzis and Georgios Kalamatianos", title = "Suggesting Points-of-Interest via Content-Based, Collaborative, and Hybrid Fusion Methods in Mobile Devices", journal = j-TOIS, volume = "36", number = "3", pages = "23:1--23:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3125620", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommending venues or points-of-interest (POIs) is a hot topic in recent years, especially for tourism applications and mobile users. We propose and evaluate several suggestion methods, taking an effectiveness, feasibility, efficiency, and privacy perspective. The task is addressed by two content-based methods (a Weighted kNN classifier and a Rated Rocchio personalized query), Collaborative Filtering methods, as well as several (rank-based or rating-based) methods of merging results of different systems. Effectiveness is evaluated on two standard benchmark datasets, provided and used by TREC's Contextual Suggestion Tracks in 2015 and 2016. First, we enrich these datasets with more information on venues, collected from web services like Foursquare and Yelp; we make this extra data available for future experimentation. Then, we find that the content-based methods provide state-of-the-art effectiveness, the collaborative filtering variants mostly suffer from data sparsity problems in the current datasets, and the merging methods further improve results by mainly promoting the first relevant suggestion. Concerning mobile feasibility, efficiency, and user privacy, the content-based methods, especially Rated Rocchio, are the best. Collaborative filtering has the worst efficiency and privacy leaks. Our findings can be very useful for developing effective and efficient operational systems, respecting user privacy. Last, our experiments indicate that better benchmark datasets would be welcome, and the use of additional evaluation measures-more sensitive in recall-is recommended.", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhao:2018:TEF, author = "Jingwen Zhao and Yunjun Gao and Gang Chen and Rui Chen", title = "Towards Efficient Framework for Time-Aware Spatial Keyword Queries on Road Networks", journal = j-TOIS, volume = "36", number = "3", pages = "24:1--24:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3143802", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The spatial keyword query takes as inputs a query location and a set of query keywords and returns the answer objects by considering both their spatial distances to the query location and textual similarity with the query keywords. However, temporal information plays an important role in the spatial keyword query (where there is, to our knowledge, no prior work considering temporal information of the objects), since objects are not always valid. For instance, visitors may plan their trips according to the opening hours of attractions. Moreover, in real-life applications, objects are located on a predefined road network, and the spatial proximity of two objects is measured by the shortest path distance or travelling time between them. In this article, we study the problem of time-aware spatial keyword (TSK) query, which assumes that objects are located on the road network, and finds the k objects satisfying users' spatio-temporal description and textual constraint. We first present the pruning strategy and algorithm based on an existing index. Then, we design an efficient index structure called TG index and propose several algorithms using the TG index that can prune the search space with both spatio-temporal and textual information simultaneously. Further, we show that the TG index technique can also be applied to improve the performance of time-travel text search and spatial keyword query. Extensive experiments using both real and synthetic datasets demonstrate the effectiveness and efficiency of the presented index and algorithms.", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{McCreadie:2018:EDE, author = "Richard McCreadie and Rodrygo L. T. Santos and Craig Macdonald and Iadh Ounis", title = "Explicit Diversification of Event Aspects for Temporal Summarization", journal = j-TOIS, volume = "36", number = "3", pages = "25:1--25:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3158671", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "During major events, such as emergencies and disasters, a large volume of information is reported on newswire and social media platforms. Temporal summarization (TS) approaches are used to automatically produce concise overviews of such events by extracting text snippets from related articles over time. Current TS approaches rely on a combination of event relevance and textual novelty for snippet selection. However, for events that span multiple days, textual novelty is often a poor criterion for selecting snippets, since many snippets are textually unique but are semantically redundant or non-informative. In this article, we propose a framework for the diversification of snippets using explicit event aspects, building on recent works in search result diversification. In particular, we first propose two techniques to identify explicit aspects that a user might want to see covered in a summary for different types of event. We then extend a state-of-the-art explicit diversification framework to maximize the coverage of these aspects when selecting summary snippets for unseen events. Through experimentation over the TREC TS 2013, 2014, and 2015 datasets, we show that explicit diversification for temporal summarization significantly outperforms classical novelty-based diversification, as the use of explicit event aspects reduces the amount of redundant and off-topic snippets returned, while also increasing summary timeliness.", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chong:2018:EUV, author = "Wen-Haw Chong and Ee-Peng Lim", title = "Exploiting User and Venue Characteristics for Fine-Grained Tweet Geolocation", journal = j-TOIS, volume = "36", number = "3", pages = "26:1--26:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3156667", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Which venue is a tweet posted from? We call this a fine-grained geolocation problem. Given an observed tweet, the task is to infer its discrete posting venue, e.g., a specific restaurant. This recovers the venue context and differs from prior work, which geolocats tweets to location coordinates or cities/neighborhoods. First, we conduct empirical analysis to uncover venue and user characteristics for improving geolocation. For venues, we observe spatial homophily, in which venues near each other have more similar tweet content (i.e., text representations) compared to venues further apart. For users, we observe that they are spatially focused and more likely to visit venues near their previous visits. We also find that a substantial proportion of users post one or more geocoded tweet(s), thus providing their location history data. We then propose geolocation models that exploit spatial homophily and spatial focus characteristics plus posting time information. Our models rank candidate venues of test tweets such that the actual posting venue is ranked high. To better tune model parameters, we introduce a learning-to-rank framework. Our best model significantly outperforms state-of-the-art baselines. Furthermore, we show that tweets without any location-indicative words can be geolocated meaningfully as well.", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhao:2018:ALT, author = "Wayne Xin Zhao and Wenhui Zhang and Yulan He and Xing Xie and Ji-Rong Wen", title = "Automatically Learning Topics and Difficulty Levels of Problems in Online Judge Systems", journal = j-TOIS, volume = "36", number = "3", pages = "27:1--27:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3158670", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Online Judge (OJ) systems have been widely used in many areas, including programming, mathematical problems solving, and job interviews. Unlike other online learning systems, such as Massive Open Online Course, most OJ systems are designed for self-directed learning without the intervention of teachers. Also, in most OJ systems, problems are simply listed in volumes and there is no clear organization of them by topics or difficulty levels. As such, problems in the same volume are mixed in terms of topics or difficulty levels. By analyzing large-scale users' learning traces, we observe that there are two major learning modes (or patterns). Users either practice problems in a sequential manner from the same volume regardless of their topics or they attempt problems about the same topic, which may spread across multiple volumes. Our observation is consistent with the findings in classic educational psychology. Based on our observation, we propose a novel two-mode Markov topic model to automatically detect the topics of online problems by jointly characterizing the two learning modes. For further predicting the difficulty level of online problems, we propose a competition-based expertise model using the learned topic information. Extensive experiments on three large OJ datasets have demonstrated the effectiveness of our approach in three different tasks, including skill topic extraction, expertise competition prediction and problem recommendation.", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Levi:2018:SCP, author = "Or Levi and Ido Guy and Fiana Raiber and Oren Kurland", title = "Selective Cluster Presentation on the Search Results Page", journal = j-TOIS, volume = "36", number = "3", pages = "28:1--28:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3158672", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Web search engines present, for some queries, a cluster of results from the same specialized domain (``vertical'') on the search results page (SERP). We introduce a comprehensive analysis of the presentation of such clusters from seven different verticals based on the logs of a commercial Web search engine. This analysis reveals several unique characteristics-such as size, rank, and clicks-of result clusters from community question-and-answer websites. The study of properties of this result cluster-specifically as part of the SERP-has received little attention in previous work. Our analysis also motivates the pursuit of a long-standing challenge in ad hoc retrieval, namely, selective cluster retrieval. In our setting, the specific challenge is to select for presentation the documents most highly ranked either by a cluster-based approach (those in the top-retrieved cluster) or by a document-based approach. We address this classification task by representing queries with features based on those utilized for ranking the clusters, query-performance predictors, and properties of the document-clustering structure. Empirical evaluation performed with TREC data shows that our approach outperforms a recently proposed state-of-the-art cluster-based document-retrieval method as well as state-of-the-art document-retrieval methods that do not account for inter-document similarities.", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liao:2018:JMP, author = "Yi Liao and Wai Lam and Lidong Bing and Xin Shen", title = "Joint Modeling of Participant Influence and Latent Topics for Recommendation in Event-based Social Networks", journal = j-TOIS, volume = "36", number = "3", pages = "29:1--29:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3183712", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Event-based social networks (EBSNs) are becoming popular in recent years. Users can publish a planned event on an EBSN website, calling for other users to participate in the event. When a user is making a decision on whether to participate in an event in EBSNs, one aspect for consideration is existing participants defined as users who have agreed to join this event. Existing participants of the event may affect the decision of the user, to which we refer as participant influence. However, participant influence is not well studied by previous works. In this article, we propose an event recommendation model that considers participant influence, and exploits the influence of existing participants on the decisions of new participants based on Poisson factorization. The effect of participant influence is associated with the target event, the host group of the event, and the location of the event. Furthermore, our proposed model can extract latent event topics from event text descriptions, and characterize events, groups, and locations by distributions of event topics. Associations between latent event topics and participant influence are exploited for improving event recommendation. Besides making event recommendation, the proposed model is able to reveal the semantic properties of the participant influence between two users semantically. We have conducted extensive experiments on some datasets extracted from a real-world EBSN. Our proposed model achieves superior event recommendation performance over several state-of-the-art models. The results demonstrate that the consideration of participant influence can improve event recommendation.", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Guy:2018:CVS, author = "Ido Guy", title = "The Characteristics of Voice Search: Comparing Spoken with Typed-in Mobile {Web} Search Queries", journal = j-TOIS, volume = "36", number = "3", pages = "30:1--30:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3182163", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The growing popularity of mobile search and the advancement in voice recognition technologies have opened the door for web search users to speak their queries rather than type them. While this kind of voice search is still in its infancy, it is gradually becoming more widespread. In this article, we report a comprehensive voice search query log analysis of a commercial web search engine's mobile application. We compare voice and text search by various aspects, with special focus on the semantic and syntactic characteristics of the queries. Our analysis suggests that voice queries focus more on audio-visual content and question answering and less on social networking and adult domains. In addition, voice queries are more commonly submitted on the go. We also conduct an empirical evaluation showing that the language of voice queries is closer to natural language than the language of text queries. Our analysis points out further differences between voice and text search. We discuss the implications of these differences for the design of future voice-enabled web search tools.", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Guo:2018:CIP, author = "Long Guo and Dongxiang Zhang and Yuan Wang and Huayu Wu and Bin Cui and Kian-Lee Tan", title = "{CO} 2: Inferring Personal Interests From Raw Footprints by Connecting the Offline World with the Online World", journal = j-TOIS, volume = "36", number = "3", pages = "31:1--31:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3182164", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "User-generated trajectories (UGTs), such as travel records from bus companies, capture rich information of human mobility in the offline world. However, some interesting applications of these raw footprints have not been exploited well due to the lack of textual information to infer the subject's personal interests. Although there is rich semantic information contained in the spatial- and temporal-aware user-generated contents (STUGC) published in the online world, such as Twitter, less effort has been made to utilize this information to facilitate the interest discovery process. In this article, we design an effective probabilistic framework named CO$^2$ to connect the offline world with the online world in order to discover users' interests directly from their raw footprints in UGT. CO$^2$ first infers trip intentions by utilizing the semantic information in STUGC and then discovers user interests by aggregating the intentions. To evaluate the effectiveness of CO$^2$, we use two large-scale real-world datasets as a case study and further conduct a questionnaire survey to show the superior performance of CO$^2$.", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Yang:2018:ULP, author = "Jing Yang and Carsten Eickhoff", title = "Unsupervised Learning of Parsimonious General-Purpose Embeddings for User and Location Modeling", journal = j-TOIS, volume = "36", number = "3", pages = "32:1--32:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3182165", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Many social network applications depend on robust representations of spatio-temporal data. In this work, we present an embedding model based on feed-forward neural networks which transforms social media check-ins into dense feature vectors encoding geographic, temporal, and functional aspects for modeling places, neighborhoods, and users. We employ the embedding model in a variety of applications including location recommendation, urban functional zone study, and crime prediction. For location recommendation, we propose a Spatio-Temporal Embedding Similarity algorithm (STES) based on the embedding model. In a range of experiments on real life data collected from Foursquare, we demonstrate our model's effectiveness at characterizing places and people and its applicability in aforementioned problem domains. Finally, we select eight major cities around the globe and verify the robustness and generality of our model by porting pre-trained models from one city to another, thereby alleviating the need for costly local training.", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lian:2018:GSL, author = "Defu Lian and Kai Zheng and Yong Ge and Longbing Cao and Enhong Chen and Xing Xie", title = "{GeoMF++}: Scalable Location Recommendation via Joint Geographical Modeling and Matrix Factorization", journal = j-TOIS, volume = "36", number = "3", pages = "33:1--33:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3182166", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Location recommendation is an important means to help people discover attractive locations. However, extreme sparsity of user-location matrices leads to a severe challenge, so it is necessary to take implicit feedback characteristics of user mobility data into account and leverage the location's spatial information. To this end, based on previously developed GeoMF, we propose a scalable and flexible framework, dubbed GeoMF++, for joint geographical modeling and implicit feedback-based matrix factorization. We then develop an efficient optimization algorithm for parameter learning, which scales linearly with data size and the total number of neighbor grids of all locations. GeoMF++ can be well explained from two perspectives. First, it subsumes two-dimensional kernel density estimation so that it captures spatial clustering phenomenon in user mobility data; Second, it is strongly connected with widely used neighbor additive models, graph Laplacian regularized models, and collective matrix factorization. Finally, we extensively evaluate GeoMF++ on two large-scale LBSN datasets. The experimental results show that GeoMF++ consistently outperforms the state-of-the-art and other competing baselines on both datasets in terms of NDCG and Recall. Besides, the efficiency studies show that GeoMF++ is much more scalable with the increase of data size and the dimension of latent space.", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tan:2018:QTQ, author = "Jiwei Tan and Xiaojun Wan and Hui Liu and Jianguo Xiao", title = "{QuoteRec}: Toward Quote Recommendation for Writing", journal = j-TOIS, volume = "36", number = "3", pages = "34:1--34:??", month = apr, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3183370", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Quote is a language phenomenon of transcribing the statement of someone else, such as a proverb and a famous saying. An appropriate usage of quote usually equips the expression with more elegance and credibility. However, there are times when we are eager to stress our idea by citing a quote, while nothing relevant comes to mind. Therefore, it is exciting to have a recommender system which provides quote recommendations while we are writing. This article extends previous study of quote recommendation, the task that recommends the appropriate quote according to the context (i.e., the content occurring before and after the quote). In this article, a quote recommender system called QuoteRec is presented to tackle the task. We investigate two models to learn the vector representations of quotes and contexts, and then rank the candidate quotes based on the representations. The first model learns the quote representation according to the contexts of a quote. The second model is an extension of the neural network model in previous study, which learns the representation of a quote by concerning both its content and contexts. Experimental results demonstrate the effectiveness of the two models in learning the semantic representations of quotes, and the neural network model achieves state-of-the-art results on the quote recommendation task.", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Nelissen:2018:STU, author = "Klaas Nelissen and Monique Snoeck and Seppe {Vanden Broucke} and Bart Baesens", title = "Swipe and Tell: Using Implicit Feedback to Predict User Engagement on Tablets", journal = j-TOIS, volume = "36", number = "4", pages = "35:1--35:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3185153", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "When content consumers explicitly judge content positively, we consider them to be engaged. Unfortunately, explicit user evaluations are difficult to collect, as they require user effort. Therefore, we propose to use device interactions as implicit feedback to detect engagement. We assess the usefulness of swipe interactions on tablets for predicting engagement and make the comparison with using traditional features based on time spent. We gathered two unique datasets of more than 250,000 swipes, 100,000 unique article visits, and over 35,000 explicitly judged news articles by modifying two commonly used tablet apps of two newspapers. We tracked all device interactions of 407 experiment participants during one month of habitual news reading. We employed a behavioral metric as a proxy for engagement, because our analysis needed to be scalable to many users, and scanning behavior required us to allow users to indicate engagement quickly. We point out the importance of taking into account content ordering, report the most predictive features, zoom in on briefly read content and on the most frequently read articles. Our findings demonstrate that fine-grained tablet interactions are useful indicators of engagement for newsreaders on tablets. The best features successfully combine both time-based aspects and swipe interactions.", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Goldberg:2018:FID, author = "David Goldberg and Andrew Trotman and Xiao Wang and Wei Min and Zongru Wan", title = "Further Insights on Drawing Sound Conclusions from Noisy Judgments", journal = j-TOIS, volume = "36", number = "4", pages = "36:1--36:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3186195", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The effectiveness of a search engine is typically evaluated using hand-labeled datasets, where the labels indicate the relevance of documents to queries. Often the number of labels needed is too large to be created by the best annotators, and so less expensive labels (e.g., from crowdsourcing) are used. This introduces errors in the labels, and thus errors in standard effectiveness metrics (such as P@k and DCG). These errors must be taken into consideration when using the metrics. Previous work has approached assessor error by taking aggregates over multiple inexpensive assessors. We take a different approach and introduce equations and algorithms that can adjust the metrics to the values they would have had if there were no annotation errors. This is especially important when two search engines are compared on their metrics. We give examples where one engine appeared to be statistically significantly better than the other, but the effect disappeared after the metrics were corrected for annotation error. In other words, the evidence supporting a statistical difference was illusory and caused by a failure to account for annotation error.", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Bekhet:2018:ISB, author = "Saddam Bekhet and Amr Ahmed", title = "An Integrated Signature-Based Framework for Efficient Visual Similarity Detection and Measurement in Video Shots", journal = j-TOIS, volume = "36", number = "4", pages = "37:1--37:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3190784", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article presents a framework for speedy video matching and retrieval through detection and measurement of visual similarity. The framework's efficiency stems from its power to encode a given shot content into a compact fixed-length signature that helps in robust real-time matching. Separate scene and motion signatures are developed and fused together to fully represent and match respective video shots. Scene information is captured through the Statistical Dominant Color Profile (SDCP), while motion information is captured through a graph-based signature called the Dominant Color Graph Profile (DCGP). The SDCP is a fixed-length compact signature that statistically encodes the colors' spatiotemporal patterns across video frames. The DCGP is a fixed-length signature that records and tracks the gray levels across subsampled video frames, where the graph structural properties are used to extract the signature values. Finally, the overall video signature is generated by fusing the individual scene and motion signatures. The signature-based aspect of the proposed framework is the key to its high matching speed (> 2000 fps) compared to current techniques that rely on exhaustive processing. To maximize the benefit of the framework, compressed-domain videos are utilized as a case study following their wide availability. However, the framework avoids full video decompression and operates on tiny frames rather than full-size decompressed frames. Experiments on various standard and challenging dataset groups show the framework's robust performance in terms of both retrieval and computational performance.", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{VanGysel:2018:NVS, author = "Christophe {Van Gysel} and Maarten de Rijke and Evangelos Kanoulas", title = "Neural Vector Spaces for Unsupervised Information Retrieval", journal = j-TOIS, volume = "36", number = "4", pages = "38:1--38:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3196826", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We propose the Neural Vector Space Model (NVSM), a method that learns representations of documents in an unsupervised manner for news article retrieval. In the NVSM paradigm, we learn low-dimensional representations of words and documents from scratch using gradient descent and rank documents according to their similarity with query representations that are composed from word representations. We show that NVSM performs better at document ranking than existing latent semantic vector space methods. The addition of NVSM to a mixture of lexical language models and a state-of-the-art baseline vector space model yields a statistically significant increase in retrieval effectiveness. Consequently, NVSM adds a complementary relevance signal. Next to semantic matching, we find that NVSM performs well in cases where lexical matching is needed. NVSM learns a notion of term specificity directly from the document collection without feature engineering. We also show that NVSM learns regularities related to Luhn significance. Finally, we give advice on how to deploy NVSM in situations where model selection (e.g., cross-validation) is infeasible. We find that an unsupervised ensemble of multiple models trained with different hyperparameter values performs better than a single cross-validated model. Therefore, NVSM can safely be used for ranking documents without supervised relevance judgments.", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ren:2018:SRE, author = "Pengjie Ren and Zhumin Chen and Zhaochun Ren and Furu Wei and Liqiang Nie and Jun Ma and Maarten de Rijke", title = "Sentence Relations for Extractive Summarization with Deep Neural Networks", journal = j-TOIS, volume = "36", number = "4", pages = "39:1--39:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3200864", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Sentence regression is a type of extractive summarization that achieves state-of-the-art performance and is commonly used in practical systems. The most challenging task within the sentence regression framework is to identify discriminative features to represent each sentence. In this article, we study the use of sentence relations, e.g., Contextual Sentence Relations (CSR), Title Sentence Relations (TSR), and Query Sentence Relations (QSR), so as to improve the performance of sentence regression. CSR, TSR, and QSR refer to the relations between a main body sentence and its local context, its document title, and a given query, respectively. We propose a deep neural network model, Sentence Relation-based Summarization (SRSum), that consists of five sub-models, PriorSum, CSRSum, TSRSum, QSRSum, and SFSum. PriorSum encodes the latent semantic meaning of a sentence using a bi-gram convolutional neural network. SFSum encodes the surface information of a sentence, e.g., sentence length, sentence position, and so on. CSRSum, TSRSum, and QSRSum are three sentence relation sub-models corresponding to CSR, TSR, and QSR, respectively. CSRSum evaluates the ability of each sentence to summarize its local contexts. Specifically, CSRSum applies a CSR-based word-level and sentence-level attention mechanism to simulate the context-aware reading of a human reader, where words and sentences that have anaphoric relations or local summarization abilities are easily remembered and paid attention to. TSRSum evaluates the semantic closeness of each sentence with respect to its title, which usually reflects the main ideas of a document. TSRSum applies a TSR-based attention mechanism to simulate people's reading ability with the main idea (title) in mind. QSRSum evaluates the relevance of each sentence with given queries for the query-focused summarization. QSRSum applies a QSR-based attention mechanism to simulate the attentive reading of a human reader with some queries in mind. The mechanism can recognize which parts of the given queries are more likely answered by a sentence under consideration. Finally as a whole, SRSum automatically learns useful latent features by jointly learning representations of query sentences, content sentences, and title sentences as well as their relations. We conduct extensive experiments on six benchmark datasets, including generic multi-document summarization and query-focused multi-document summarization. On both tasks, SRSum achieves comparable or superior performance compared with state-of-the-art approaches in terms of multiple ROUGE metrics.", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Middleton:2018:LES, author = "Stuart E. Middleton and Giorgos Kordopatis-Zilos and Symeon Papadopoulos and Yiannis Kompatsiaris", title = "Location Extraction from Social Media: Geoparsing, Location Disambiguation, and Geotagging", journal = j-TOIS, volume = "36", number = "4", pages = "40:1--40:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3202662", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Location extraction, also called ``toponym extraction,'' is a field covering geoparsing, extracting spatial representations from location mentions in text, and geotagging, assigning spatial coordinates to content items. This article evaluates five ``best-of-class'' location extraction algorithms. We develop a geoparsing algorithm using an OpenStreetMap database, and a geotagging algorithm using a language model constructed from social media tags and multiple gazetteers. Third-party work evaluated includes a DBpedia-based entity recognition and disambiguation approach, a named entity recognition and Geonames gazetteer approach, and a Google Geocoder API approach. We perform two quantitative benchmark evaluations, one geoparsing tweets and one geotagging Flickr posts, to compare all approaches. We also perform a qualitative evaluation recalling top N location mentions from tweets during major news events. The OpenStreetMap approach was best (F1 0.90+) for geoparsing English, and the language model approach was best (F1 0.66) for Turkish. The language model was best (F1@1km 0.49) for the geotagging evaluation. The map database was best (R@20 0.60+) in the qualitative evaluation. We report on strengths, weaknesses, and a detailed failure analysis for the approaches and suggest concrete areas for further research.", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Arguello:2018:FIU, author = "Jaime Arguello and Bogeum Choi and Robert Capra", title = "Factors Influencing Users' Information Requests: Medium, Target, and Extra-Topical Dimension", journal = j-TOIS, volume = "36", number = "4", pages = "41:1--41:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3209624", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We report on a crowdsourced study that investigated how two factors influence the way people formulate information requests. Our first factor, medium, considers whether the request is produced using text or voice. Our second factor, target, considers whether the request is intended for a search engine or a human intermediary (i.e., someone who will search on the user's behalf). In particular, we study how these two factors influence the way people formulate requests in situations where the information need has a specific type of extra-topical dimension (i.e., a type of constraint that is independent from the information need's topic). We focus on six extra-topical dimensions: (1) domain knowledge, (2) viewpoint, (3) experiential, (4) venue location, (5) source location, and (6) temporal. The extra-topical dimension was manipulated by giving participants carefully constructed search tasks. We analyzed a large number of information requests produced by study participants, and address three research questions. We study the effects of our two factors (medium and target) on (RQ1) participants' perceptions about their own information requests, (RQ2) the different characteristics of their information requests (e.g., natural language structure, retrieval performance), and (RQ3) participants' strategies for requesting information when the search task has a specific type of extra-topical dimension. Our results found that both factors influenced participants' perceptions about their own information requests, the characteristics of participants' requests, and the strategies adopted by participants to request information matching the extra-topical dimension. Our results have implications for future research on methods that can harness (rather than ignore) extra-topical query terms to retrieve relevant information.", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Mao:2018:HDD, author = "Jiaxin Mao and Yiqun Liu and Noriko Kando and Min Zhang and Shaoping Ma", title = "How Does Domain Expertise Affect Users' Search Interaction and Outcome in Exploratory Search?", journal = j-TOIS, volume = "36", number = "4", pages = "42:1--42:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3223045", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "People often conduct exploratory search to explore unfamiliar information space and learn new knowledge. While supporting the highly dynamic and interactive exploratory search is still challenging for the search system, we want to investigate which factors can make the exploratory search successful and satisfying from the user's perspective. Previous research suggests that domain experts have different search strategies and are more successful in finding domain-specific information, but how the domain expertise level will influence users' interaction and search outcomes in exploratory search, especially in different knowledge domains, is still unclear. In this work, via a carefully designed user study that involves 30 participants, we investigate the influence of domain expertise levels on the interaction and outcome of exploratory search in three different domains: environment, medicine, and politics. We record participants' search behaviors, including their explicit feedback and eye fixation sequences, in a laboratory setting. With this dataset, we identify both domain-independent and domain-dependent effects on user behaviors and search outcomes. Our results extend existing research on the effect of domain expertise in search and suggest different strategies for exploiting domain expertise to support exploratory search in different knowledge domains.", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2018:LAI, author = "Yanhao Wang and Yuchen Li and Ju Fan and Kian-Lee Tan", title = "Location-aware Influence Maximization over Dynamic Social Streams", journal = j-TOIS, volume = "36", number = "4", pages = "43:1--43:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3230871", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Influence maximization (IM), which selects a set of k seed users (a.k.a., a seed set ) to maximize the influence spread over a social network, is a fundamental problem in a wide range of applications. However, most existing IM algorithms are static and location-unaware. They fail to provide high-quality seed sets efficiently when the social network evolves rapidly and IM queries are location-aware. In this article, we first define two IM queries, namely Stream Influence Maximization (SIM) and Location-aware SIM (LSIM), to track influential users over social streams. Technically, SIM adopts the sliding window model and maintains a seed set with the maximum influence value collectively over the most recent social actions. LSIM further considers social actions are associated with geo-tags and identifies a seed set that maximizes the influence value in a query region over a location-aware social stream. Then, we propose the Sparse Influential Checkpoints (SIC) framework for efficient SIM query processing. SIC maintains a sequence of influential checkpoints over the sliding window and each checkpoint maintains a partial solution for SIM in an append-only substream of social actions. Theoretically, SIC keeps a logarithmic number of checkpoints w.r.t. the size of the sliding window and always returns an approximate solution from one of the checkpoint for the SIM query at any time. Furthermore, we propose the Location-based SIC (LSIC) framework and its improved version LSIC$^+$, both of which process LSIM queries by integrating the SIC framework with a Quadtree spatial index. LSIC can provide approximate solutions for both ad hoc and continuous LSIM queries in real time, while LSIC$^+$ further improves the solution quality of LSIC. Experimental results on real-world datasets demonstrate the effectiveness and efficiency of the proposed frameworks against the state-of-the-art IM algorithms.", acknowledgement = ack-nhfb, articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ruotsalo:2018:IIM, author = "Tuukka Ruotsalo and Jaakko Peltonen and Manuel J. A. Eugster and Dorota G{\l}owacka and Patrik Flor{\'e}en and Petri Myllym{\"a}ki and Giulio Jacucci and Samuel Kaski", title = "Interactive Intent Modeling for Exploratory Search", journal = j-TOIS, volume = "36", number = "4", pages = "44:1--44:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3231593", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Exploratory search requires the system to assist the user in comprehending the information space and expressing evolving search intents for iterative exploration and retrieval of information. We introduce interactive intent modeling, a technique that models a user's evolving search intents and visualizes them as keywords for interaction. The user can provide feedback on the keywords, from which the system learns and visualizes an improved intent estimate and retrieves information. We report experiments comparing variants of a system implementing interactive intent modeling to a control system. Data comprising search logs, interaction logs, essay answers, and questionnaires indicate significant improvements in task performance, information retrieval performance over the session, information comprehension performance, and user experience. The improvements in retrieval effectiveness can be attributed to the intent modeling and the effect on users' task performance, breadth of information comprehension, and user experience are shown to be dependent on a richer visualization. Our results demonstrate the utility of combining interactive modeling of search intentions with interactive visualization of the models that can benefit both directing the exploratory search process and making sense of the information space. Our findings can help design personalized systems that support exploratory information seeking and discovery of novel information.", acknowledgement = ack-nhfb, articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Aliannejadi:2018:PCA, author = "Mohammad Aliannejadi and Fabio Crestani", title = "Personalized Context-Aware Point of Interest Recommendation", journal = j-TOIS, volume = "36", number = "4", pages = "45:1--45:??", month = oct, year = "2018", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3231933", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:51:59 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Personalized recommendation of Points of Interest (POIs) plays a key role in satisfying users on Location-Based Social Networks (LBSNs). In this article, we propose a probabilistic model to find the mapping between user-annotated tags and locations' taste keywords. Furthermore, we introduce a dataset on locations' contextual appropriateness and demonstrate its usefulness in predicting the contextual relevance of locations. We investigate four approaches to use our proposed mapping for addressing the data sparsity problem: one model to reduce the dimensionality of location taste keywords and three models to predict user tags for a new location. Moreover, we present different scores calculated from multiple LBSNs and show how we incorporate new information from the mapping into a POI recommendation approach. Then, the computed scores are integrated using learning to rank techniques. The experiments on two TREC datasets show the effectiveness of our approach, beating state-of-the-art methods.", acknowledgement = ack-nhfb, articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Mic:2019:BSS, author = "Vladimir Mic and David Novak and Pavel Zezula", title = "Binary Sketches for Secondary Filtering", journal = j-TOIS, volume = "37", number = "1", pages = "1:1--1:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3231936", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "This article addresses the problem of matching the most similar data objects to a given query object. We adopt a generic model of similarity that involves the domain of objects and metric distance functions only. We examine the case of a large dataset in a complex data space, which makes this problem inherently difficult. Many indexing and searching approaches have been proposed, but they have often failed to efficiently prune complex search spaces and access large portions of the dataset when evaluating queries. We propose an approach to enhancing the existing search techniques to significantly reduce the number of accessed data objects while preserving the quality of the search results. In particular, we extend each data object with its sketch, a short binary string in Hamming space. These sketches approximate the similarity relationships in the original search space, and we use them to filter out non-relevant objects not pruned by the original search technique. We provide a probabilistic model to tune the parameters of the sketch-based filtering separately for each query object. Experiments conducted with different similarity search techniques and real-life datasets demonstrate that the secondary filtering can speed-up similarity search several times.", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Safran:2019:ELB, author = "Mejdl Safran and Dunren Che", title = "Efficient Learning-Based Recommendation Algorithms for Top- N Tasks and Top- N Workers in Large-Scale Crowdsourcing Systems", journal = j-TOIS, volume = "37", number = "1", pages = "2:1--2:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3231934", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The task and worker recommendation problems in crowdsourcing systems have brought up unique characteristics that are not present in traditional recommendation scenarios, i.e., the huge flow of tasks with short lifespans, the importance of workers' capabilities, and the quality of the completed tasks. These unique features make traditional recommendation approaches no longer satisfactory for task and worker recommendation in crowdsourcing systems. In this article, we propose a two-tier data representation scheme (defining a worker--category suitability score and a worker--task attractiveness score ) to support personalized task and worker recommendations. We also extend two optimization methods, namely least mean square error and Bayesian personalized rank, to better fit the characteristics of task/worker recommendation in crowdsourcing systems. We then integrate the proposed representation scheme and the extended optimization methods along with the two adapted popular learning models, i.e., matrix factorization and kNN, and result in two lines of top- N recommendation algorithms for crowdsourcing systems: (1) Top- N -Tasks recommendation algorithms for discovering the top- N most suitable tasks for a given worker and (2) Top- N -Workers recommendation algorithms for identifying the top- N best workers for a task requester. An extensive experimental study is conducted that validates the effectiveness and efficiency of a broad spectrum of algorithms, accompanied by our analysis and the insights gained.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Deveaud:2019:LAR, author = "Romain Deveaud and Josiane Mothe and Md Zia Ullah and Jian-Yun Nie", title = "Learning to Adaptively Rank Document Retrieval System Configurations", journal = j-TOIS, volume = "37", number = "1", pages = "3:1--3:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3231937", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Modern Information Retrieval (IR) systems have become more and more complex, involving a large number of parameters. For example, a system may choose from a set of possible retrieval models (BM25, language model, etc.), or various query expansion parameters, whose values greatly influence the overall retrieval effectiveness. Traditionally, these parameters are set at a system level based on training queries, and the same parameters are then used for different queries. We observe that it may not be easy to set all these parameters separately, since they can be dependent. In addition, a global setting for all queries may not best fit all individual queries with different characteristics. The parameters should be set according to these characteristics. In this article, we propose a novel approach to tackle this problem by dealing with the entire system configurations (i.e., a set of parameters representing an IR system behaviour) instead of selecting a single parameter at a time. The selection of the best configuration is cast as a problem of ranking different possible configurations given a query. We apply learning-to-rank approaches for this task. We exploit both the query features and the system configuration features in the learning-to-rank method so that the selection of configuration is query dependent. The experiments we conducted on four TREC ad hoc collections show that this approach can significantly outperform the traditional method to tune system configuration globally (i.e., grid search) and leads to higher effectiveness than the top performing systems of the TREC tracks. We also perform an ablation analysis on the impact of different features on the model learning capability and show that query expansion features are among the most important for adaptive systems.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Alakuijala:2019:BGP, author = "Jyrki Alakuijala and Andrea Farruggia and Paolo Ferragina and Eugene Kliuchnikov and Robert Obryk and Zoltan Szabadka and Lode Vandevenne", title = "{Brotli}: a General-Purpose Data Compressor", journal = j-TOIS, volume = "37", number = "1", pages = "4:1--4:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3231935", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/datacompression.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Brotli is an open source general-purpose data compressor introduced by Google in late 2013 and now adopted in most known browsers and Web servers. It is publicly available on GitHub and its data format was submitted as RFC 7932 in July 2016. Brotli is based on the Lempel--Ziv compression scheme and planned as a generic replacement of Gzip and ZLib. The main goal in its design was to compress data on the Internet, which meant optimizing the resources used at decoding time, while achieving maximal compression density. This article is intended to provide the first thorough, systematic description of the Brotli format as well as a detailed computational and experimental analysis of the main algorithmic blocks underlying the current encoder implementation, together with a comparison against compressors of different families constituting the state-of-the-art either in practice or in theory. This treatment will allow us to raise a set of new algorithmic and software engineering problems that deserve further attention from the scientific community.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Qu:2019:PBN, author = "Yanru Qu and Bohui Fang and Weinan Zhang and Ruiming Tang and Minzhe Niu and Huifeng Guo and Yong Yu and Xiuqiang He", title = "Product-Based Neural Networks for User Response Prediction over Multi-Field Categorical Data", journal = j-TOIS, volume = "37", number = "1", pages = "5:1--5:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3233770", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "User response prediction is a crucial component for personalized information retrieval and filtering scenarios, such as recommender system and web search. The data in user response prediction is mostly in a multi-field categorical format and transformed into sparse representations via one-hot encoding. Due to the sparsity problems in representation and optimization, most research focuses on feature engineering and shallow modeling. Recently, deep neural networks have attracted research attention on such a problem for their high capacity and end-to-end training scheme. In this article, we study user response prediction in the scenario of click prediction. We first analyze a coupled gradient issue in latent vector-based models and propose kernel product to learn field-aware feature interactions. Then, we discuss an insensitive gradient issue in DNN-based models and propose Product-based Neural Network, which adopts a feature extractor to explore feature interactions. Generalizing the kernel product to a net-in-net architecture, we further propose Product-network in Network (PIN), which can generalize previous models. Extensive experiments on four industrial datasets and one contest dataset demonstrate that our models consistently outperform eight baselines on both area under curve and log loss. Besides, PIN makes great click-through rate improvement (relatively 34.67\%) in online A/B test.", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Huang:2019:QTQ, author = "Heyan Huang and Xiaochi Wei and Liqiang Nie and Xianling Mao and Xin-Shun Xu", title = "From Question to Text: Question-Oriented Feature Attention for Answer Selection", journal = j-TOIS, volume = "37", number = "1", pages = "6:1--6:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3233771", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Understanding unstructured texts is an essential skill for human beings as it enables knowledge acquisition. Although understanding unstructured texts is easy for we human beings with good education, it is a great challenge for machines. Recently, with the rapid development of artificial intelligence techniques, researchers put efforts to teach machines to understand texts and justify the educated machines by letting them solve the questions upon the given unstructured texts, inspired by the reading comprehension test as we humans do. However, feature effectiveness with respect to different questions significantly hinders the performance of answer selection, because different questions may focus on various aspects of the given text and answer candidates. To solve this problem, we propose a question-oriented feature attention (QFA) mechanism, which learns to weight different engineering features according to the given question, so that important features with respect to the specific question is emphasized accordingly. Experiments on MCTest dataset have well-validated the effectiveness of the proposed method. Additionally, the proposed QFA is applicable to various IR tasks, such as question answering and answer selection. We have verified the applicability on a crawled community-based question-answering dataset.", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lu:2019:DBT, author = "Wei Lu and Fu-Lai Chung and Wenhao Jiang and Martin Ester and Wei Liu", title = "A Deep {Bayesian} Tensor-Based System for Video Recommendation", journal = j-TOIS, volume = "37", number = "1", pages = "7:1--7:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3233773", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the availability of abundant online multi-relational video information, recommender systems that can effectively exploit these sorts of data and suggest creatively interesting items will become increasingly important. Recent research illustrates that tensor models offer effective approaches for complex multi-relational data learning and missing element completion. So far, most tensor-based user clustering models have focused on the accuracy of recommendation. Given the dynamic nature of online media, recommendation in this setting is more challenging as it is difficult to capture the users' dynamic topic distributions in sparse data settings as well as to identify unseen items as candidates of recommendation. Targeting at constructing a recommender system that can encourage more creativity, a deep Bayesian probabilistic tensor framework for tag and item recommendation is proposed. During the score ranking processes, a metric called Bayesian surprise is incorporated to increase the creativity of the recommended candidates. The new algorithm, called Deep Canonical PARAFAC Factorization (DCPF), is evaluated on both synthetic and large-scale real-world problems. An empirical study for video recommendation demonstrates the superiority of the proposed model and indicates that it can better capture the latent patterns of interactions and generates interesting recommendations based on creative tag combinations.", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tymoshenko:2019:SDS, author = "Kateryna Tymoshenko and Alessandro Moschitti", title = "Shallow and Deep Syntactic\slash Semantic Structures for Passage Reranking in Question-Answering Systems", journal = j-TOIS, volume = "37", number = "1", pages = "8:1--8:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3233772", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In this article, we extensively study the use of syntactic and semantic structures obtained with shallow and full syntactic parsers for answer passage reranking. We propose several dependency and constituent-based structures, also enriched with Linked Open Data (LD) knowledge to represent pairs of questions and answer passages. We encode such tree structures in learning-to-rank (L2R) algorithms using tree kernels, which can project them in tree substructure spaces, where each dimension represents a powerful syntactic/semantic feature. Additionally, since we define links between question and passage structures, our tree kernel spaces also include relational structural features. We carried out an extensive comparative experimentation of our models for automatic answer selection benchmarks on different TREC QA corpora as well as the newer Wikipedia-based dataset, namely WikiQA, which has been widely used to test sentence rerankers. The results consistently demonstrate that our structural semantic models achieve the state of the art in passage reranking. In particular, we derived the following important findings: (i) relational syntactic structures are essential to achieve superior results; (ii) models trained with dependency trees can outperform those trained with shallow trees, e.g., in case of sentence reranking; (iii) external knowledge automatically generated with focus and question classifiers is very effective; and (iv) the semantic information derived by LD and incorporated in syntactic structures can be used to replace the knowledge provided by the above-mentioned classifiers. This is a remarkable advantage as it enables our models to increase coverage and portability over new domains.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Li:2019:SGT, author = "Chenliang Li and Shiqian Chen and Jian Xing and Aixin Sun and Zongyang Ma", title = "Seed-Guided Topic Model for Document Filtering and Classification", journal = j-TOIS, volume = "37", number = "1", pages = "9:1--9:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3238250", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "One important necessity is to filter out the irrelevant information and organize the relevant information into meaningful categories. However, developing text classifiers often requires a large number of labeled documents as training examples. Manually labeling documents is costly and time-consuming. More importantly, it becomes unrealistic to know all the categories covered by the documents beforehand. Recently, a few methods have been proposed to label documents by using a small set of relevant keywords for each category, known as dataless text classification. In this article, we propose a seed-guided topic model for the dataless text filtering and classification (named DFC). Given a collection of unlabeled documents, and for each specified category a small set of seed words that are relevant to the semantic meaning of the category, DFC filters out the irrelevant documents and classifies the relevant documents into the corresponding categories through topic influence. DFC models two kinds of topics: category-topics and general-topics. Also, there are two kinds of category-topics: relevant-topics and irrelevant-topics. Each relevant-topic is associated with one specific category, representing its semantic meaning. The irrelevant-topics represent the semantics of the unknown categories covered by the document collection. And the general-topics capture the global semantic information. DFC assumes that each document is associated with a single category-topic and a mixture of general-topics. A novelty of the model is that DFC learns the topics by exploiting the explicit word co-occurrence patterns between the seed words and regular words (i.e., non-seed words) in the document collection. A document is then filtered, or classified, based on its posterior category-topic assignment. Experiments on two widely used datasets show that DFC consistently outperforms the state-of-the-art dataless text classifiers for both classification with filtering and classification without filtering. In many tasks, DFC can also achieve comparable or even better classification accuracy than the state-of-the-art supervised learning solutions. Our experimental results further show that DFC is insensitive to the tuning parameters. Moreover, we conduct a thorough study about the impact of seed words for existing dataless text classification techniques. The results reveal that it is not using more seed words but the document coverage of the seed words for the corresponding category that affects the dataless classification performance.", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pan:2019:TRH, author = "Weike Pan and Qiang Yang and Wanling Cai and Yaofeng Chen and Qing Zhang and Xiaogang Peng and Zhong Ming", title = "Transfer to Rank for Heterogeneous One-Class Collaborative Filtering", journal = j-TOIS, volume = "37", number = "1", pages = "10:1--10:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3243652", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Heterogeneous one-class collaborative filtering is an emerging and important problem in recommender systems, where two different types of one-class feedback, i.e., purchases and browses, are available as input data. The associated challenges include ambiguity of browses, scarcity of purchases, and heterogeneity arising from different feedback. In this article, we propose to model purchases and browses from a new perspective, i.e., users' roles of mixer, browser and purchaser. Specifically, we design a novel transfer learning solution termed role-based transfer to rank (RoToR), which contains two variants, i.e., integrative RoToR and sequential RoToR. In integrative RoToR, we leverage browses into the preference learning task of purchases, in which we take each user as a sophisticated customer (i.e., mixer ) that is able to take different types of feedback into consideration. In sequential RoToR, we aim to simplify the integrative one by decomposing it into two dependent phases according to a typical shopping process. Furthermore, we instantiate both variants using different preference learning paradigms such as pointwise preference learning and pairwise preference learning. Finally, we conduct extensive empirical studies with various baseline methods on three large public datasets and find that our RoToR can perform significantly more accurate than the state-of-the-art methods.", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Oard:2019:JME, author = "Douglas W. Oard and Fabrizio Sebastiani and Jyothi K. Vinjumur", title = "Jointly Minimizing the Expected Costs of Review for Responsiveness and Privilege in E-Discovery", journal = j-TOIS, volume = "37", number = "1", pages = "11:1--11:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3268928", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Discovery is an important aspect of the civil litigation process in the United States of America, in which all parties to a lawsuit are permitted to request relevant evidence from other parties. With the rapid growth of digital content, the emerging need for ``e-discovery'' has created a strong demand for techniques that can be used to review massive collections both for ``responsiveness'' (i.e., relevance) to the request and for ``privilege'' (i.e., presence of legally protected content that the party performing the review may have a right to withhold). In this process, the party performing the review may incur costs of two types, namely, annotation costs (deriving from the fact that human reviewers need to be paid for their work) and misclassification costs (deriving from the fact that failing to correctly determine the responsiveness or privilege of a document may adversely affect the interests of the parties in various ways). Relying exclusively on automatic classification would minimize annotation costs but could result in substantial misclassification costs, while relying exclusively on manual classification could generate the opposite consequences. This article proposes a risk minimization framework (called MINECORE, for ``minimizing the expected costs of review'') that seeks to strike an optimal balance between these two extreme stands. In MINECORE (a) the documents are first automatically classified for both responsiveness and privilege, and then (b) some of the automatically classified documents are annotated by human reviewers for responsiveness (typically by junior reviewers) and/or, in cascade, for privilege (typically by senior reviewers), with the overall goal of minimizing the expected cost (i.e., the risk ) of the entire process. Risk minimization is achieved by optimizing, for both responsiveness and privilege, the choice of which documents to manually review. We present a simulation study in which classes from a standard text classification test collection (RCV1-v2) are used as surrogates for responsiveness and privilege. The results indicate that MINECORE can yield substantially lower total cost than any of a set of strong baselines.", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chen:2019:ADE, author = "Xu Chen and Yongfeng Zhang and Hongteng Xu and Zheng Qin and Hongyuan Zha", title = "Adversarial Distillation for Efficient Recommendation with External Knowledge", journal = j-TOIS, volume = "37", number = "1", pages = "12:1--12:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3281659", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Integrating external knowledge into the recommendation system has attracted increasing attention in both industry and academic communities. Recent methods mostly take the power of neural network for effective knowledge representation to improve the recommendation performance. However, the heavy deep architectures in existing models are usually incorporated in an embedded manner, which may greatly increase the model complexity and lower the runtime efficiency. To simultaneously take the power of deep learning for external knowledge modeling as well as maintaining the model efficiency at test time, we reformulate the problem of recommendation with external knowledge into a generalized distillation framework. The general idea is to free the complex deep architecture into a separate model, which is only used in the training phrase, while abandoned at test time. In particular, in the training phrase, the external knowledge is processed by a comprehensive teacher model to produce valuable information to teach a simple and efficient student model. Once the framework is learned, the teacher model is abandoned, and only the succinct yet enhanced student model is used to make fast predictions at test time. In this article, we specify the external knowledge as user review, and to leverage it in an effective manner, we further extend the traditional generalized distillation framework by designing a Selective Distillation Network (SDNet) with adversarial adaption and orthogonality constraint strategies to make it more robust to noise information. Extensive experiments verify that our model can not only improve the performance of rating prediction, but also can significantly reduce time consumption when making predictions as compared with several state-of-the-art methods.", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cornolti:2019:SPA, author = "Marco Cornolti and Paolo Ferragina and Massimiliano Ciaramita and Stefan R{\"u}d and Hinrich Sch{\"u}tze", title = "{SMAPH}: a Piggyback Approach for Entity-Linking in {Web} Queries", journal = j-TOIS, volume = "37", number = "1", pages = "13:1--13:??", month = jan, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3284102", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We study the problem of linking the terms of a web-search query to a semantic representation given by the set of entities (a.k.a. concepts) mentioned in it. We introduce SMAPH, a system that performs this task using the information coming from a web search engine, an approach we call ``piggybacking.'' We employ search engines to alleviate the noise and irregularities that characterize the language of queries. Snippets returned as search results also provide a context for the query that makes it easier to disambiguate the meaning of the query. From the search results, SMAPH builds a set of candidate entities with high coverage. This set is filtered by linking back the candidate entities to the terms occurring in the input query, ensuring high precision. A greedy disambiguation algorithm performs this filtering; it maximizes the coherence of the solution by iteratively discovering the pertinent entities mentioned in the query. We propose three versions of SMAPH that outperform state-of-the-art solutions on the known benchmarks and on the GERDAQ dataset, a novel dataset that we have built specifically for this problem via crowd-sourcing and that we make publicly available.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Niu:2019:UFS, author = "Xi Niu and Xiangyu Fan and Tao Zhang", title = "Understanding Faceted Search from Data Science and Human Factor Perspectives", journal = j-TOIS, volume = "37", number = "2", pages = "14:1--14:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3284101", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3284101", abstract = "Faceted search has become a common feature on most search interfaces in e-commerce websites, digital libraries, government's open information portals, and so on. Beyond the existing studies on developing algorithms for faceted search and empirical studies on facet usage, this study investigated user real-time interactions with facets over the course of a search from both data science and human factor perspectives. It adopted a Random Forest (RF) model to successfully predict facet use using search dynamic variables. In addition, the RF model provided a ranking of variables by their predictive power, which suggests that the search process follows rhythmic flow of a sequence within which facet addition is mostly influenced by its immediately preceding action. In the follow-up user study, we found that participants used facets at critical points from the beginning to end of search sessions. Participants used facets for distinctive reasons at different stages. They also used facets implicitly without applying the facets to their search. Most participants liked the faceted search, although a few participants were concerned about the choice overload introduced by facets. The results of this research can be used to understand information seekers and propose or refine a set of practical design guidelines for faceted search.", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Loni:2019:TRM, author = "Babak Loni and Roberto Pagano and Martha Larson and Alan Hanjalic", title = "Top-{$N$} Recommendation with Multi-Channel Positive Feedback using Factorization Machines", journal = j-TOIS, volume = "37", number = "2", pages = "15:1--15:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3291756", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3291756", abstract = "User interactions can be considered to constitute different feedback channels, for example, view, click, like or follow, that provide implicit information on users' preferences. Each implicit feedback channel typically carries a unary, positive-only signal that can be exploited by collaborative filtering models to generate lists of personalized recommendations. This article investigates how a learning-to-rank recommender system can best take advantage of implicit feedback signals from multiple channels. We focus on Factorization Machines (FMs) with Bayesian Personalized Ranking (BPR), a pairwise learning-to-rank method, that allows us to experiment with different forms of exploitation. We perform extensive experiments on three datasets with multiple types of feedback to arrive at a series of insights. We compare conventional, direct integration of feedback types with our proposed method, which exploits multiple feedback channels during the sampling process of training. We refer to our method as multi-channel sampling. Our results show that multi-channel sampling outperforms conventional integration, and that sampling with the relative ``level'' of feedback is always superior to a level-blind sampling approach. We evaluate our method experimentally on three datasets in different domains and observe that with our multi-channel sampler the accuracy of recommendations can be improved considerably compared to the state-of-the-art models. Further experiments reveal that the appropriate sampling method depends on particular properties of datasets such as popularity skewness.", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cheng:2019:MER, author = "Zhiyong Cheng and Xiaojun Chang and Lei Zhu and Rose C. Kanjirathinkal and Mohan Kankanhalli", title = "{MMALFM}: Explainable Recommendation by Leveraging Reviews and Images", journal = j-TOIS, volume = "37", number = "2", pages = "16:1--16:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3291060", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3291060", abstract = "Personalized rating prediction is an important research problem in recommender systems. Although the latent factor model (e.g., matrix factorization) achieves good accuracy in rating prediction, it suffers from many problems including cold-start, non-transparency, and suboptimal results for individual user-item pairs. In this article, we exploit textual reviews and item images together with ratings to tackle these limitations. Specifically, we first apply a proposed multi-modal aspect-aware topic model (MATM) on text reviews and item images to model users' preferences and items' features from different aspects, and also estimate the aspect importance of a user toward an item. Then, the aspect importance is integrated into a novel aspect-aware latent factor model (ALFM), which learns user's and item's latent factors based on ratings. In particular, ALFM introduces a weight matrix to associate those latent factors with the same set of aspects in MATM, such that the latent factors could be used to estimate aspect ratings. Finally, the overall rating is computed via a linear combination of the aspect ratings, which are weighted by the corresponding aspect importance. To this end, our model could alleviate the data sparsity problem and gain good interpretability for recommendation. Besides, every aspect rating is weighted by its aspect importance, which is dependent on the targeted user's preferences and the targeted item's features. Therefore, it is expected that the proposed method can model a user's preferences on an item more accurately for each user-item pair. Comprehensive experimental studies have been conducted on the Yelp 2017 Challenge dataset and Amazon product datasets. Results show that (1) our method achieves significant improvement compared to strong baseline methods, especially for users with only few ratings; (2) item visual features can improve the prediction performance-the effects of item image features on improving the prediction results depend on the importance of the visual features for the items; and (3) our model can explicitly interpret the predicted results in great detail.", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chong:2019:FGG, author = "Wen-Haw Chong and Ee-Peng Lim", title = "Fine-grained Geolocation of Tweets in Temporal Proximity", journal = j-TOIS, volume = "37", number = "2", pages = "17:1--17:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3291059", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3291059", abstract = "In fine-grained tweet geolocation, tweets are linked to the specific venues (e.g., restaurants, shops) from which they were posted. This explicitly recovers the venue context that is essential for applications such as location-based advertising or user profiling. For this geolocation task, we focus on geolocating tweets that are contained in tweet sequences. In a tweet sequence, tweets are posted from some latent venue(s) by the same user and within a short time interval. This scenario arises from two observations: (1) It is quite common that users post multiple tweets in a short time and (2) most tweets are not geocoded. To more accurately geolocate a tweet, we propose a model that performs query expansion on the tweet (query) using two novel approaches. The first approach temporal query expansion considers users' staying behavior around venues. The second approach visitation query expansion leverages on user revisiting the same or similar venues in the past. We combine both query expansion approaches via a novel fusion framework and overlay them on a Hidden Markov Model to account for sequential information. In our comprehensive experiments across multiple datasets and metrics, we show our proposed model to be more robust and accurate than other baselines.", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Qian:2019:SRL, author = "Tieyun Qian and Bei Liu and Quoc Viet Hung Nguyen and Hongzhi Yin", title = "Spatiotemporal Representation Learning for Translation-Based {POI} Recommendation", journal = j-TOIS, volume = "37", number = "2", pages = "18:1--18:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3295499", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3295499", abstract = "The increasing proliferation of location-based social networks brings about a huge volume of user check-in data, which facilitates the recommendation of points of interest (POIs). Time and location are the two most important contextual factors in the user's decision-making for choosing a POI to visit. In this article, we focus on the spatiotemporal context-aware POI recommendation, which considers the joint effect of time and location for POI recommendation. Inspired by the recent advances in knowledge graph embedding, we propose a spatiotemporal context-aware and translation-based recommender framework (STA) to model the third-order relationship among users, POIs, and spatiotemporal contexts for large-scale POI recommendation. Specifically, we embed both users and POIs into a ``transition space'' where spatiotemporal contexts (i.e., a \< time, location \> pair) are modeled as translation vectors operating on users and POIs. We further develop a series of strategies to exploit various correlation information to address the data sparsity and cold-start issues for new spatiotemporal contexts, new users, and new POIs. We conduct extensive experiments on two real-world datasets. The experimental results demonstrate that our STA framework achieves the superior performance in terms of high recommendation accuracy, robustness to data sparsity, and effectiveness in handling the cold-start problem.", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Guo:2019:ALS, author = "Yangyang Guo and Zhiyong Cheng and Liqiang Nie and Yinglong Wang and Jun Ma and Mohan Kankanhalli", title = "Attentive Long Short-Term Preference Modeling for Personalized Product Search", journal = j-TOIS, volume = "37", number = "2", pages = "19:1--19:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3295822", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3295822", abstract = "E-commerce users may expect different products even for the same query, due to their diverse personal preferences. It is well known that there are two types of preferences: long-term ones and short-term ones. The former refers to users' inherent purchasing bias and evolves slowly. By contrast, the latter reflects users' purchasing inclination in a relatively short period. They both affect users' current purchasing intentions. However, few research efforts have been dedicated to jointly model them for the personalized product search. To this end, we propose a novel Attentive Long Short-Term Preference model, dubbed as ALSTP, for personalized product search. Our model adopts the neural networks approach to learn and integrate the long- and short-term user preferences with the current query for the personalized product search. In particular, two attention networks are designed to distinguish which factors in the short-term as well as long-term user preferences are more relevant to the current query. This unique design enables our model to capture users' current search intentions more accurately. Our work is the first to apply attention mechanisms to integrate both long- and short-term user preferences with the given query for the personalized search. Extensive experiments over four Amazon product datasets show that our model significantly outperforms several state-of-the-art product search methods in terms of different evaluation metrics.", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lukasik:2019:GPR, author = "Michal Lukasik and Kalina Bontcheva and Trevor Cohn and Arkaitz Zubiaga and Maria Liakata and Rob Procter", title = "{Gaussian} Processes for Rumour Stance Classification in Social Media", journal = j-TOIS, volume = "37", number = "2", pages = "20:1--20:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3295823", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3295823", abstract = "Social media tend to be rife with rumours while new reports are released piecemeal during breaking news. Interestingly, one can mine multiple reactions expressed by social media users in those situations, exploring their stance towards rumours, ultimately enabling the flagging of highly disputed rumours as being potentially false. In this work, we set out to develop an automated, supervised classifier that uses multi-task learning to classify the stance expressed in each individual tweet in a conversation around a rumour as either supporting, denying or questioning the rumour. Using a Gaussian Process classifier, and exploring its effectiveness on two datasets with very different characteristics and varying distributions of stances, we show that our approach consistently outperforms competitive baseline classifiers. Our classifier is especially effective in estimating the distribution of different types of stance associated with a given rumour, which we set forth as a desired characteristic for a rumour-tracking system that will show both ordinary users of Twitter and professional news practitioners how others orient to the disputed veracity of a rumour, with the final aim of establishing its actual truth value.", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Cagliero:2019:EMD, author = "Luca Cagliero and Paolo Garza and Elena Baralis", title = "{ELSA}: a Multilingual Document Summarization Algorithm Based on Frequent Itemsets and Latent Semantic Analysis", journal = j-TOIS, volume = "37", number = "2", pages = "21:1--21:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3298987", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3298987", abstract = "Sentence-based summarization aims at extracting concise summaries of collections of textual documents. Summaries consist of a worthwhile subset of document sentences. The most effective multilingual strategies rely on Latent Semantic Analysis (LSA) and on frequent itemset mining, respectively. LSA-based summarizers pick the document sentences that cover the most important concepts. Concepts are modeled as combinations of single-document terms and are derived from a term-by-sentence matrix by exploiting Singular Value Decomposition (SVD). Itemset-based summarizers pick the sentences that contain the largest number of frequent itemsets, which represent combinations of frequently co-occurring terms. The main drawbacks of existing approaches are (i) the inability of LSA to consider the correlation between combinations of multiple-document terms and the underlying concepts, (ii) the inherent redundancy of frequent itemsets because similar itemsets may be related to the same concept, and (iii) the inability of itemset-based summarizers to correlate itemsets with the underlying document concepts. To overcome the issues of both of the abovementioned algorithms, we propose a new summarization approach that exploits frequent itemsets to describe all of the latent concepts covered by the documents under analysis and LSA to reduce the potentially redundant set of itemsets to a compact set of uncorrelated concepts. The summarizer selects the sentences that cover the latent concepts with minimal redundancy. We tested the summarization algorithm on both multilingual and English-language benchmark document collections. The proposed approach performed significantly better than both itemset- and LSA-based summarizers, and better than most of the other state-of-the-art approaches.", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wu:2019:CAU, author = "Libing Wu and Cong Quan and Chenliang Li and Qian Wang and Bolong Zheng and Xiangyang Luo", title = "A Context-Aware User-Item Representation Learning for Item Recommendation", journal = j-TOIS, volume = "37", number = "2", pages = "22:1--22:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3298988", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3298988", abstract = "Both reviews and user-item interactions (i.e., rating scores) have been widely adopted for user rating prediction. However, these existing techniques mainly extract the latent representations for users and items in an independent and static manner. That is, a single static feature vector is derived to encode user preference without considering the particular characteristics of each candidate item. We argue that this static encoding scheme is incapable of fully capturing users' preferences, because users usually exhibit different preferences when interacting with different items. In this article, we propose a novel context-aware user-item representation learning model for rating prediction, named CARL. CARL derives a joint representation for a given user-item pair based on their individual latent features and latent feature interactions. Then, CARL adopts Factorization Machines to further model higher order feature interactions on the basis of the user-item pair for rating prediction. Specifically, two separate learning components are devised in CARL to exploit review data and interaction data, respectively: review-based feature learning and interaction-based feature learning. In the review-based learning component, with convolution operations and attention mechanism, the pair-based relevant features for the given user-item pair are extracted by jointly considering their corresponding reviews. However, these features are only review-driven and may not be comprehensive. Hence, an interaction-based learning component further extracts complementary features from interaction data alone, also on the basis of user-item pairs. The final rating score is then derived with a dynamic linear fusion mechanism. Experiments on seven real-world datasets show that CARL achieves significantly better rating prediction accuracy than existing state-of-the-art alternatives. Also, with the attention mechanism, we show that the pair-based relevant information (i.e., context-aware information) in reviews can be highlighted to interpret the rating prediction for different user-item pairs.", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2019:MVB, author = "Ming Liu and Gu Gong and Bing Qin and Ting Liu", title = "A Multi-View-Based Collective Entity Linking Method", journal = j-TOIS, volume = "37", number = "2", pages = "23:1--23:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3300197", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3300197", abstract = "Facing lots of name mentions appearing on the web, entity linking is essential for many information processing applications. To improve linking accuracy, the relations between entities are usually considered in the linking process. This kind of method is called collective entity linking and can obtain high-quality results. There are two kinds of information helpful to reveal the relations between entities, i.e., contextual information and structural information of entities. Most traditional collective entity linking methods consider them separately. In fact, these two kinds of information represent entities from specific and diverse views and can enhance each other, respectively. Besides, if we look into each view closely, it can be separated into sub-views that are more meaningful. For this reason, this article proposes a multi-view-based collective entity linking algorithm, which combines several views of entities into an objective function for entity linking. The importance of each view can be valued and the linking results can be obtained along with resolving this objective function. Experimental results demonstrate that our linking algorithm can acquire higher accuracy than many state-of-the-art entity linking methods. Besides, since we simplify the entity's structure and change the entity linking to a sub-matrix searching problem, our algorithm also obtains high efficiency.", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Sousa:2019:RSL, author = "Daniel Xavier Sousa and S{\'e}rgio Canuto and Marcos Andr{\'e} Gon{\c{c}}alves and Thierson Couto Rosa and Wellington Santos Martins", title = "Risk-Sensitive Learning to Rank with Evolutionary Multi-Objective Feature Selection", journal = j-TOIS, volume = "37", number = "2", pages = "24:1--24:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3300196", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3300196", abstract = "Learning to Rank (L2R) is one of the main research lines in Information Retrieval. Risk-sensitive L2R is a sub-area of L2R that tries to learn models that are good on average while at the same time reducing the risk of performing poorly in a few but important queries (e.g., medical or legal queries). One way of reducing risk in learned models is by selecting and removing noisy, redundant features, or features that promote some queries to the detriment of others. This is exacerbated by learning methods that usually maximize an average metric (e.g., mean average precision (MAP) or Normalized Discounted Cumulative Gain (NDCG)). However, historically, feature selection (FS) methods have focused only on effectiveness and feature reduction as the main objectives. Accordingly, in this work, we propose to evaluate FS for L2R with an additional objective in mind, namely risk-sensitiveness. We present novel single and multi-objective criteria to optimize feature reduction, effectiveness, and risk-sensitiveness, all at the same time. We also introduce a new methodology to explore the search space, suggesting effective and efficient extensions of a well-known Evolutionary Algorithm (SPEA2) for FS applied to L2R. Our experiments show that explicitly including risk as an objective criterion is crucial to achieving a more effective and risk-sensitive performance. We also provide a thorough analysis of our methodology and experimental results.", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Pibiri:2019:HMG, author = "Giulio Ermanno Pibiri and Rossano Venturini", title = "Handling Massive {$N$}-Gram Datasets Efficiently", journal = j-TOIS, volume = "37", number = "2", pages = "25:1--25:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3302913", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3302913", abstract = "Two fundamental problems concern the handling of large n -gram language models: indexing, that is, compressing the n -grams and associated satellite values without compromising their retrieval speed, and estimation, that is, computing the probability distribution of the n -grams extracted from a large textual source. Performing these two tasks efficiently is vital for several applications in the fields of Information Retrieval, Natural Language Processing, and Machine Learning, such as auto-completion in search engines and machine translation. Regarding the problem of indexing, we describe compressed, exact, and lossless data structures that simultaneously achieve high space reductions and no time degradation with respect to the state-of-the-art solutions and related software packages. In particular, we present a compressed trie data structure in which each word of an n -gram following a context of fixed length k, that is, its preceding k words, is encoded as an integer whose value is proportional to the number of words that follow such context. Since the number of words following a given context is typically very small in natural languages, we lower the space of representation to compression levels that were never achieved before, allowing the indexing of billions of strings. Despite the significant savings in space, our technique introduces a negligible penalty at query time. Specifically, the most space-efficient competitors in the literature, which are both quantized and lossy, do not take less than our trie data structure and are up to 5 times slower. Conversely, our trie is as fast as the fastest competitor but also retains an advantage of up to 65\% in absolute space. Regarding the problem of estimation, we present a novel algorithm for estimating modified Kneser-Ney language models that have emerged as the de-facto choice for language modeling in both academia and industry thanks to their relatively low perplexity performance. Estimating such models from large textual sources poses the challenge of devising algorithms that make a parsimonious use of the disk. The state-of-the-art algorithm uses three sorting steps in external memory: we show an improved construction that requires only one sorting step by exploiting the properties of the extracted n -gram strings. With an extensive experimental analysis performed on billions of n -grams, we show an average improvement of 4.5 times on the total runtime of the previous approach.", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhan:2019:LMA, author = "Xueying Zhan and Yaowei Wang and Yanghui Rao and Qing Li", title = "Learning from Multi-annotator Data: a Noise-aware Classification Framework", journal = j-TOIS, volume = "37", number = "2", pages = "26:1--26:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3309543", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3309543", abstract = "In the field of sentiment analysis and emotion detection in social media, or other tasks such as text classification involving supervised learning, researchers rely more heavily on large and accurate labelled training datasets. However, obtaining large-scale labelled datasets is time-consuming and high-quality labelled datasets are expensive and scarce. To deal with these problems, online crowdsourcing systems provide us an efficient way to accelerate the process of collecting training data via distributing the enormous tasks to various annotators to help create large amounts of labelled data at an affordable cost. Nowadays, these crowdsourcing platforms are heavily needed in dealing with social media text, since the social network platforms (e.g., Twitter) generate huge amounts of data in textual form everyday. However, people from different social and knowledge backgrounds have different views on various texts, which may lead to noisy labels. The existing noisy label aggregation/refinement algorithms mostly focus on aggregating labels from noisy annotations, which would not guarantee their effectiveness on the subsequent classification/ranking tasks. In this article, we propose a noise-aware classification framework that integrates the steps of noisy label aggregation and classification. The aggregated noisy crowd labels are fed into a classifier for training, while the predicted labels are employed as feedback for adjusting the parameters at the label aggregating stage. The classification framework is suitable for directly running on crowdsourcing datasets and applies to various kinds of classification algorithms. The feedback strategy makes it possible for us to find optimal parameters instead of using known data for parameter selection. Simulation experiments demonstrate that our method provide significant label aggregation performance for both binary and multiple classification tasks under various noisy environments. Experimenting on real-world data validates the feasibility of our framework in real noise data and helps us verify the reasonableness of the simulated experiment settings.", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Feng:2019:TRR, author = "Fuli Feng and Xiangnan He and Xiang Wang and Cheng Luo and Yiqun Liu and Tat-Seng Chua", title = "Temporal Relational Ranking for Stock Prediction", journal = j-TOIS, volume = "37", number = "2", pages = "27:1--27:??", month = mar, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3309547", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3309547", abstract = "Stock prediction aims to predict the future trends of a stock in order to help investors make good investment decisions. Traditional solutions for stock prediction are based on time-series models. With the recent success of deep neural networks in modeling sequential data, deep learning has become a promising choice for stock prediction. However, most existing deep learning solutions are not optimized toward the target of investment, i.e., selecting the best stock with the highest expected revenue. Specifically, they typically formulate stock prediction as a classification (to predict stock trends) or a regression problem (to predict stock prices). More importantly, they largely treat the stocks as independent of each other. The valuable signal in the rich relations between stocks (or companies), such as two stocks are in the same sector and two companies have a supplier-customer relation, is not considered. In this work, we contribute a new deep learning solution, named Relational Stock Ranking (RSR), for stock prediction. Our RSR method advances existing solutions in two major aspects: (1) tailoring the deep learning models for stock ranking, and (2) capturing the stock relations in a time-sensitive manner. The key novelty of our work is the proposal of a new component in neural network modeling, named Temporal Graph Convolution, which jointly models the temporal evolution and relation network of stocks. To validate our method, we perform back-testing on the historical data of two stock markets, NYSE and NASDAQ. Extensive experiments demonstrate the superiority of our RSR method. It outperforms state-of-the-art stock prediction solutions achieving an average return ratio of 98\% and 71\% on NYSE and NASDAQ, respectively.", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Guan:2019:AAM, author = "Xinyu Guan and Zhiyong Cheng and Xiangnan He and Yongfeng Zhang and Zhibo Zhu and Qinke Peng and Tat-Seng Chua", title = "Attentive Aspect Modeling for Review-Aware Recommendation", journal = j-TOIS, volume = "37", number = "3", pages = "28:1--28:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3309546", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3309546", abstract = "In recent years, many studies extract aspects from user reviews and integrate them with ratings for improving the recommendation performance. The common aspects mentioned in a user's reviews and a product's reviews indicate indirect connections between the user and product. However, these aspect-based methods suffer from two problems. First, the common aspects are usually very sparse, which is caused by the sparsity of user-product interactions and the diversity of individual users' vocabularies. Second, a user's interests on aspects could be different with respect to different products, which are usually assumed to be static in existing methods. In this article, we propose an Attentive Aspect-based Recommendation Model (AARM) to tackle these challenges. For the first problem, to enrich the aspect connections between user and product, besides common aspects, AARM also models the interactions between synonymous and similar aspects. For the second problem, a neural attention network which simultaneously considers user, product, and aspect information is constructed to capture a user's attention toward aspects when examining different products. Extensive quantitative and qualitative experiments show that AARM can effectively alleviate the two aforementioned problems and significantly outperforms several state-of-the-art recommendation methods on the top-N recommendation task.", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Shao:2019:AMI, author = "Yunqiu Shao and Yiqun Liu and Fan Zhang and Min Zhang and Shaoping Ma", title = "On Annotation Methodologies for Image Search Evaluation", journal = j-TOIS, volume = "37", number = "3", pages = "29:1--29:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3309994", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3309994", abstract = "Image search engines differ significantly from general web search engines in the way of presenting search results. The difference leads to different interaction and examination behavior patterns, and therefore requires changes in evaluation methodologies. However, evaluation of image search still utilizes the methods for general web search. In particular, offline metrics are calculated based on coarse-fine topical relevance judgments with the assumption that users examine results in a sequential manner. In this article, we investigate annotation methods via crowdsourcing for image search evaluation based on a lab-based user study. Using user satisfaction as the golden standard, we make several interesting findings. First, instead of item-based annotation, annotating relevance in a row-based way is more efficient without hurting performance. Second, besides topical relevance, image quality plays a crucial role when evaluating the image search results, and the importance of image quality changes with search intent. Third, compared to traditional four-level scales, the fine-grain annotation method outperforms significantly. To our best knowledge, our work is the first to systematically study how diverse factors in data annotation impact image search evaluation. Our results suggest different strategies for exploiting the crowdsourcing to get data annotated under different conditions.", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ferro:2019:UCS, author = "Nicola Ferro and Yubin Kim and Mark Sanderson", title = "Using Collection Shards to Study Retrieval Performance Effect Sizes", journal = j-TOIS, volume = "37", number = "3", pages = "30:1--30:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3310364", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3310364", abstract = "Despite the bulk of research studying how to more accurately compare the performance of IR systems, less attention is devoted to better understanding the different factors that play a role in such performance and how they interact. This is the case of shards, i.e., partitioning a document collection into sub-parts, which are used for many different purposes, ranging from efficiency to selective search or making test collection evaluation more accurate. In all these cases, there is empirical knowledge supporting the importance of shards, but we lack actual models that allow us to measure the impact of shards on system performance and how they interact with topics and systems. We use the general linear mixed model framework and present a model that encompasses the experimental factors of system, topic, shard, and their interaction effects. This detailed model allows us to more accurately estimate differences between the effect of various factors. We study shards created by a range of methods used in prior work and better explain observations noted in prior work in a principled setting and offer new insights. Notably, we discover that the topic*shard interaction effect, in particular, is a large effect almost globally across all datasets, an observation that, to our knowledge, has not been measured before.", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Li:2019:PRP, author = "Xinyi Li and Yifan Chen and Benjamin Pettit and Maarten {De Rijke}", title = "Personalised Reranking of Paper Recommendations Using Paper Content and User Behavior", journal = j-TOIS, volume = "37", number = "3", pages = "31:1--31:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3312528", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3312528", abstract = "Academic search engines have been widely used to access academic papers, where users' information needs are explicitly represented as search queries. Some modern recommender systems have taken one step further by predicting users' information needs without the presence of an explicit query. In this article, we examine an academic paper recommender that sends out paper recommendations in email newsletters, based on the users' browsing history on the academic search engine. Specifically, we look at users who regularly browse papers on the search engine, and we sign up for the recommendation newsletters for the first time. We address the task of reranking the recommendation candidates that are generated by a production system for such users. We face the challenge that the users on whom we focus have not interacted with the recommender system before, which is a common scenario that every recommender system encounters when new users sign up. We propose an approach to reranking candidate recommendations that utilizes both paper content and user behavior. The approach is designed to suit the characteristics unique to our academic recommendation setting. For instance, content similarity measures can be used to find the closest match between candidate recommendations and the papers previously browsed by the user. To this end, we use a knowledge graph derived from paper metadata to compare entity similarities (papers, authors, and journals) in the embedding space. Since the users on whom we focus have no prior interactions with the recommender system, we propose a model to learn a mapping from users' browsed articles to user clicks on the recommendations. We combine both content and behavior into a hybrid reranking model that outperforms the production baseline significantly, providing a relative 13\% increase in Mean Average Precision and 28\% in Precision@1. Moreover, we provide a detailed analysis of the model components, highlighting where the performance boost comes from. The obtained insights reveal useful components for the reranking process and can be generalized to other academic recommendation settings as well, such as the utility of graph embedding similarity. Also, recent papers browsed by users provide stronger evidence for recommendation than historical ones.", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wang:2019:EHO, author = "Hongwei Wang and Fuzheng Zhang and Jialin Wang and Miao Zhao and Wenjie Li and Xing Xie and Minyi Guo", title = "Exploring High-Order User Preference on the Knowledge Graph for Recommender Systems", journal = j-TOIS, volume = "37", number = "3", pages = "32:1--32:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3312738", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3312738", abstract = "To address the sparsity and cold-start problem of collaborative filtering, researchers usually make use of side information, such as social networks or item attributes, to improve the performance of recommendation. In this article, we consider the knowledge graph (KG) as the source of side information. To address the limitations of existing embedding-based and path-based methods for KG-aware recommendation, we propose RippleNet, an end-to-end framework that naturally incorporates the KG into recommender systems. RippleNet has two versions: (1) The outward propagation version, which is analogous to the actual ripples on water, stimulates the propagation of user preferences over the set of knowledge entities by automatically and iteratively extending a user's potential interests along links in the KG. The multiple ``ripples'' activated by a user's historically clicked items are thus superposed to form the preference distribution of the user with respect to a candidate item. (2) The inward aggregation version aggregates and incorporates the neighborhood information biasedly when computing the representation of a given entity. The neighborhood can be extended to multiple hops away to model high-order proximity and capture users' long-distance interests. In addition, we intuitively demonstrate how a KG assists with recommender systems in RippleNet, and we also find that RippleNet provides a new perspective of explainability for the recommended results in terms of the KG. Through extensive experiments on real-world datasets, we demonstrate that both versions of RippleNet achieve substantial gains in a variety of scenarios, including movie, book, and news recommendations, over several state-of-the-art baselines.", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Xue:2019:DIB, author = "Feng Xue and Xiangnan He and Xiang Wang and Jiandong Xu and Kai Liu and Richang Hong", title = "Deep Item-based Collaborative Filtering for Top-{$N$} Recommendation", journal = j-TOIS, volume = "37", number = "3", pages = "33:1--33:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3314578", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3314578", abstract = "Item-based Collaborative Filtering (ICF) has been widely adopted in recommender systems in industry, owing to its strength in user interest modeling and ease in online personalization. By constructing a user's profile with the items that the user has consumed, ICF recommends items that are similar to the user's profile. With the prevalence of machine learning in recent years, significant processes have been made for ICF by learning item similarity (or representation) from data. Nevertheless, we argue that most existing works have only considered linear and shallow relationships between items, which are insufficient to capture the complicated decision-making process of users. In this article, we propose a more expressive ICF solution by accounting for the nonlinear and higher-order relationships among items. Going beyond modeling only the second-order interaction (e.g., similarity) between two items, we additionally consider the interaction among all interacted item pairs by using nonlinear neural networks. By doing this, we can effectively model the higher-order relationship among items, capturing more complicated effects in user decision-making. For example, it can differentiate which historical itemsets in a user's profile are more important in affecting the user to make a purchase decision on an item. We treat this solution as a deep variant of ICF, thus term it as DeepICF. To justify our proposal, we perform empirical studies on two public datasets from MovieLens and Pinterest. Extensive experiments verify the highly positive effect of higher-order item interaction modeling with nonlinear neural networks. Moreover, we demonstrate that by more fine-grained second-order interaction modeling with attention network, the performance of our DeepICF method can be further improved.", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2019:MAD, author = "Zheng Zhang and Minlie Huang and Zhongzhou Zhao and Feng Ji and Haiqing Chen and Xiaoyan Zhu", title = "Memory-Augmented Dialogue Management for Task-Oriented Dialogue Systems", journal = j-TOIS, volume = "37", number = "3", pages = "34:1--34:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3317612", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3317612", abstract = "Dialogue management (DM) is responsible for predicting the next action of a dialogue system according to the current dialogue state and thus plays a central role in task-oriented dialogue systems. Since DM requires having access not only to local utterances but also to the global semantics of the entire dialogue session, modeling the long-range history information is a critical issue. To this end, we propose MAD, a novel memory-augmented dialogue management model that employs a memory controller and two additional memory structures (i.e., a slot-value memory and an external memory). The slot-value memory tracks the dialogue state by memorizing and updating the values of semantic slots (i.e., cuisine, price, and location), and the external memory augments the representation of hidden states of traditional recurrent neural networks by storing more context information. To update the dialogue state efficiently, we also propose slot-level attention on user utterances to extract specific semantic information for each slot. Experiments show that our model can obtain state-of-the-art performance and outperforms existing baselines.", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Wu:2019:DDA, author = "Zhijing Wu and Ke Zhou and Yiqun Liu and Min Zhang and Shaoping Ma", title = "Does Diversity Affect User Satisfaction in Image Search", journal = j-TOIS, volume = "37", number = "3", pages = "35:1--35:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3320118", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3320118", abstract = "Diversity has been taken into consideration by existing Web image search engines in ranking search results. However, there is no thorough investigation of how diversity affects user satisfaction in image search. In this article, we address the following questions: (1) How do different factors, such as content and visual presentations, affect users' perception of diversity? (2) How does search result diversity affect user satisfaction with different search intents? To answer those questions, we conduct a set of laboratory user studies to collect users' perceived diversity annotations and search satisfaction. We find that the existence of nearly duplicated image results has the largest impact on users' perceived diversity, followed by the similarity in content and visual presentations. Besides these findings, we also investigate the relationship between diversity and satisfaction in image search. Specifically, we find that users' preference for diversity varies across different search intents. When users want to collect information or save images for further usage (the Locate search tasks), more diversified result lists lead to higher satisfaction levels. The insights may help commercial image search engines to design better result ranking strategies and evaluation metrics.", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Arguello:2019:EWM, author = "Jaime Arguello and Bogeum Choi", title = "The Effects of Working Memory, Perceptual Speed, and Inhibition in Aggregated Search", journal = j-TOIS, volume = "37", number = "3", pages = "36:1--36:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3322128", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3322128", abstract = "Prior work has studied how different characteristics of individual users (e.g., personality traits and cognitive abilities) can impact search behaviors and outcomes. We report on a laboratory study ( N = 32) that investigated the effects of three different cognitive abilities (perceptual speed, working memory, and inhibition) in the context of aggregated search. Aggregated search systems combine results from multiple heterogeneous sources (or verticals ) in a unified presentation. Participants in our study interacted with two different aggregated search interfaces (a within-subjects design) that differed based on the extent to which the layout distinguished between results originating from different verticals. The interleaved interface merged results from different verticals in a fairly unconstrained fashion. Conversely, the blocked interface displayed results from the same vertical as a group, displayed each group of vertical results in the same region on the SERP for every query, and used a border around each group of vertical results to help distinguish among results from different sources. We investigated three research questions (RQ1--RQ3). Specifically, we investigated the effects of the interface condition and each cognitive ability on three types of outcomes: (RQ1) participants' levels of workload, (RQ2) participants' levels of user engagement, and (RQ3) participants' search behaviors. Our results found different main and interaction effects. Perceptual speed and inhibition did not significantly affect participants' workload and user engagement but significantly affected their search behaviors. Specifically, with the interleaved interface, participants with lower perceptual speed had more difficulty finding relevant results on the SERP, and participants with lower inhibitory attention control searched at a slower pace. Working memory did not have a strong effect on participants' behaviors but had several significant effects on the levels of workload and user engagement reported by participants. Specifically, participants with lower working memory reported higher levels of workload and lower levels of user engagement. We discuss implications of our results for designing aggregated search interfaces that are well suited for users with different cognitive abilities.", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Esuli:2019:FNE, author = "Andrea Esuli and Alejandro Moreo and Fabrizio Sebastiani", title = "Funnelling: a New Ensemble Method for Heterogeneous Transfer Learning and Its Application to Cross-Lingual Text Classification", journal = j-TOIS, volume = "37", number = "3", pages = "37:1--37:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3326065", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3326065", abstract = "Cross-lingual Text Classification (CLC) consists of automatically classifying, according to a common set C of classes, documents each written in one of a set of languages L, and doing so more accurately than when ``na{\"\i}vely'' classifying each document via its corresponding language-specific classifier. To obtain an increase in the classification accuracy for a given language, the system thus needs to also leverage the training examples written in the other languages. We tackle ``multilabel'' CLC via funnelling, a new ensemble learning method that we propose here. Funnelling consists of generating a two-tier classification system where all documents, irrespective of language, are classified by the same (second-tier) classifier. For this classifier, all documents are represented in a common, language-independent feature space consisting of the posterior probabilities generated by first-tier, language-dependent classifiers. This allows the classification of all test documents, of any language, to benefit from the information present in all training documents, of any language. We present substantial experiments, run on publicly available multilingual text collections, in which funnelling is shown to significantly outperform a number of state-of-the-art baselines. All code and datasets (in vector form) are made publicly available.", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2019:SRR, author = "Yiqun Liu and Junqi Zhang and Jiaxin Mao and Min Zhang and Shaoping Ma and Qi Tian and Yanxiong Lu and Leyu Lin", title = "Search Result Reranking with Visual and Structure Information Sources", journal = j-TOIS, volume = "37", number = "3", pages = "38:1--38:??", month = jul, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3329188", ISSN = "1046-8188", bibdate = "Sat Sep 21 11:52:00 MDT 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3329188", abstract = "Relevance estimation is among the most important tasks in the ranking of search results. Current methodologies mainly concentrate on text matching, link analysis, and user behavior models. However, users judge the relevance of search results directly from Search Engine Result Pages (SERPs), which provide valuable signals for reranking. In this article, we propose two different approaches to aggregate the visual, structure, as well as textual information sources of search results in relevance estimation. The first one is a late-fusion framework named Joint Relevance Estimation model (JRE). JRE estimates the relevance independently from screenshots, textual contents, and HTML source codes of search results and jointly makes the final decision through an inter-modality attention mechanism. The second one is an early-fusion framework named Tree-based Deep Neural Network (TreeNN), which embeds the texts and images into the HTML parse tree through a recursive process. To evaluate the performance of the proposed models, we construct a large-scale practical Search Result Relevance (SRR) dataset that consists of multiple information sources and relevance labels of over 60,000 search results. Experimental results show that the proposed two models achieve better performance than state-of-the-art ranking solutions as well as the original rankings of commercial search engines.", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Chen:2019:JNC, author = "Wanyu Chen and Fei Cai and Honghui Chen and Maarten {De Rijke}", title = "Joint Neural Collaborative Filtering for Recommender Systems", journal = j-TOIS, volume = "37", number = "4", pages = "39:1--39:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3343117", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3343117", abstract = "We propose a Joint Neural Collaborative Filtering (J-NCF) method for recommender systems. The J-NCF model applies a joint neural network that couples deep feature learning and deep interaction modeling with a rating matrix. Deep feature learning extracts feature representations of users and items with a deep learning architecture based on a user-item rating matrix. Deep interaction modeling captures non-linear user-item interactions with a deep neural network using the feature representations generated by the deep feature learning process as input. J-NCF enables the deep feature learning and deep interaction modeling processes to optimize each other through joint training, which leads to improved recommendation performance. In addition, we design a new loss function for optimization that takes both implicit and explicit feedback, point-wise and pair-wise loss into account. Experiments on several real-world datasets show significant improvements of J-NCF over state-of-the-art methods, with improvements of up to 8.24\% on the MovieLens 100K dataset, 10.81\% on the MovieLens 1M dataset, and 10.21\% on the Amazon Movies dataset in terms of HR@10. NDCG@10 improvements are 12.42\%, 14.24\%, and 15.06\%, respectively. We also conduct experiments to evaluate the scalability and sensitivity of J-NCF. Our experiments show that the J-NCF model has a competitive recommendation performance with inactive users and different degrees of data sparsity when compared to state-of-the-art baselines.", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2019:QAK, author = "Richong Zhang and Yue Wang and Yongyi Mao and Jinpeng Huai", title = "Question Answering in Knowledge Bases: a Verification Assisted Model with Iterative Training", journal = j-TOIS, volume = "37", number = "4", pages = "40:1--40:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3345557", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3345557", abstract = "Question answering over knowledge bases aims to take full advantage of the information in knowledge bases with the ultimate purpose of returning answers to questions. To access the substantial knowledge within the KB, many model architectures are hindered by the bottleneck of accurately predicting relations that connect subject entities in questions to object entities in the knowledge base. To break the bottleneck, this article presents a novel model architecture, APVA, which includes a verification mechanism to check the correctness of predicted relations. Specifically, APVA takes advantage of KB-based information to improve relation prediction but verifies the correctness of the predicted relation by means of simple negative sampling in a logistic regression framework. The APVA architecture offers a natural way to integrate an iterative training procedure, which we call turbo training. Accordingly, we introduce APVA-TURBO to perform question answering over knowledge bases. We demonstrate extensive experiments to show that APVA-TURBO outperforms existing approaches on question answering.", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Benham:2019:BSP, author = "Rodger Benham and Joel Mackenzie and Alistair Moffat and J. Shane Culpepper", title = "Boosting Search Performance Using Query Variations", journal = j-TOIS, volume = "37", number = "4", pages = "41:1--41:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3345001", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3345001", abstract = "Rank fusion is a powerful technique that allows multiple sources of information to be combined into a single result set. Query variations covering the same information need represent one way in which different sources of information might arise. However, when implemented in the obvious manner, fusion over query variations is not cost-effective, at odds with the usual web-search requirement for strict per-query efficiency guarantees. In this work, we propose a novel solution to query fusion by splitting the computation into two parts: one phase that is carried out offline, to generate pre-computed centroid answers for queries addressing broadly similar information needs, and then a second online phase that uses the corresponding topic centroid to compute a result page for each query. To achieve this, we make use of score-based fusion algorithms whose costs can be amortized via the pre-processing step and that can then be efficiently combined during subsequent per-query re-ranking operations. Experimental results using the ClueWeb12B collection and the UQV100 query variations demonstrate that centroid-based approaches allow improved retrieval effectiveness at little or no loss in query throughput or latency and within reasonable pre-processing requirements. We additionally show that queries that do not match any of the pre-computed clusters can be accurately identified and efficiently processed in our proposed ranking pipeline.", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Tamine:2019:OVO, author = "Lynda Tamine and Laure Soulier and Gia-Hung Nguyen and Nathalie Souf", title = "Offline versus Online Representation Learning of Documents Using External Knowledge", journal = j-TOIS, volume = "37", number = "4", pages = "42:1--42:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3349527", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3349527", abstract = "An intensive recent research work investigated the combined use of hand-curated knowledge resources and corpus-driven resources to learn effective text representations. The overall learning process could be run by online revising the learning objective or by offline refining an original learned representation. The differentiated impact of each of the learning approaches on the quality of the learned representations has not been studied so far in the literature. This article focuses on the design of comparable offline vs. online knowledge-enhanced document representation learning models and the comparison of their effectiveness using a set of standard IR and NLP downstream tasks. The results of quantitative and qualitative analyses show that (1) offline vs. online learning approaches have dissimilar result trends regarding the task as well as the dataset distribution counts with regard to domain application; (2) while considering external knowledge resources is undoubtedly beneficial, the way used to express relational constraints could affect semantic inference effectiveness. The findings of this work present opportunities for the design of future representation learning models, but also for providing insights about the evaluation of such models.", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zheng:2019:CCM, author = "Yukun Zheng and Jiaxin Mao and Yiqun Liu and Cheng Luo and Min Zhang and Shaoping Ma", title = "Constructing Click Model for Mobile Search with Viewport Time", journal = j-TOIS, volume = "37", number = "4", pages = "43:1--43:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3360486", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3360486", abstract = "A series of click models has been proposed to extract accurate and unbiased relevance feedback from valuable yet noisy click-through data in search logs. Previous works have shown that users search behavior in mobile and desktop scenarios are rather different in many aspects, therefore, the click models designed for desktop search may not be effective in the mobile context. To address this problem, we propose two novel click models for mobile search: (1) Mobile Click Model (MCM), which models click necessity bias and examination satisfaction bias; (2) Viewport Time Click Model (VTCM), which further extends MCM by utilizing the viewport time. Extensive experiments on large-scale real mobile search logs show that: (1) MCM and VTCM outperform existing models in predicting users' clicks and estimating result relevance; (2) MCM and VTCM can extract richer information, such as the click necessity of search results and the probability of user satisfaction, from mobile click logs; (3) By modeling the viewport time distributions of heterogeneous results, VTCM can bring a significant improvement over MCM in click prediction and relevance estimation tasks. Our proposed click models can help better understand user behavior patterns in mobile search and improve the ranking performance of mobile search engines.", acknowledgement = ack-nhfb, articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Raiber:2019:RFW, author = "Fiana Raiber and Oren Kurland", title = "Relevance Feedback: The Whole Is Inferior to the Sum of Its Parts", journal = j-TOIS, volume = "37", number = "4", pages = "44:1--44:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3360487", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3360487", abstract = "Document retrieval methods that utilize relevance feedback often induce a single query model from the set of feedback documents, specifically, the relevant documents. We empirically show that for a few state-of-the-art query-model induction methods, retrieval performance can be significantly improved by constructing the query model from a subset of the relevant documents rather than from all of them. Motivated by this finding, we propose a new approach for relevance-feedback-based retrieval. The approach, derived from the risk minimization framework, is based on utilizing multiple query models induced from all subsets of the given relevant documents. Empirical evaluation shows that the approach posts performance that is statistically significantly better than that of applying the standard practice of utilizing a single query model induced from the relevant documents. While the average relative improvements are small to moderate, the robustness of the approach is substantially higher than that of a variety of reference comparison methods that address various challenges in using relevance feedback.", acknowledgement = ack-nhfb, articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Liu:2019:ALL, author = "Huafeng Liu and Liping Jing and Yuhua Qian and Jian Yu", title = "Adaptive Local Low-rank Matrix Approximation for Recommendation", journal = j-TOIS, volume = "37", number = "4", pages = "45:1--45:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3360488", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3360488", abstract = "Low-rank matrix approximation (LRMA) has attracted more and more attention in the community of recommendation. Even though LRMA-based recommendation methods (including Global LRMA and Local LRMA) obtain promising results, they suffer from the complicated structure of the large-scale and sparse rating matrix, especially when the underlying system includes a large set of items with various types and a huge amount of users with diverse interests. Thus, they have to predefine the important parameters, such as the rank of the rating matrix and the number of submatrices. Moreover, most existing Local LRMA methods are usually designed in a two-phase separated framework and do not consider the missing mechanisms of rating matrix. In this article, a non-parametric unified Bayesian graphical model is proposed for Adaptive Local low-rank Matrix Approximation (ALoMA). ALoMA has ability to simultaneously identify rating submatrices, determine the optimal rank for each submatrix, and learn the submatrix-specific user/item latent factors. Meanwhile, the missing mechanism is adopted to characterize the whole rating matrix. These four parts are seamlessly integrated and enhance each other in a unified framework. Specifically, the user-item rating matrix is adaptively divided into proper number of submatrices in ALoMA by exploiting the Chinese Restaurant Process. For each submatrix, by considering both global/local structure information and missing mechanisms, the latent user/item factors are identified in an optimal latent space by adopting automatic relevance determination technique. We theoretically analyze the model's generalization error bounds and give an approximation guarantee. Furthermore, an efficient Gibbs sampling-based algorithm is designed to infer the proposed model. A series of experiments have been conducted on six real-world datasets ( Epinions, Douban, Dianping, Yelp, Movielens (10M), and Netflix ). The results demonstrate that ALoMA outperforms the state-of-the-art LRMA-based methods and can easily provide interpretable recommendation results.", acknowledgement = ack-nhfb, articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Li:2019:NNN, author = "Xin Li and Dongcheng Han and Jing He and Lejian Liao and Mingzhong Wang", title = "Next and Next New {POI} Recommendation via Latent Behavior Pattern Inference", journal = j-TOIS, volume = "37", number = "4", pages = "46:1--46:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3354187", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3354187", abstract = "Next and next new point-of-interest (POI) recommendation are essential instruments in promoting customer experiences and business operations related to locations. However, due to the sparsity of the check-in records, they still remain insufficiently studied. In this article, we propose to utilize personalized latent behavior patterns learned from contextual features, e.g., time of day, day of week, and location category, to improve the effectiveness of the recommendations. Two variations of models are developed, including GPDM, which learns a fixed pattern distribution for all users; and PPDM, which learns personalized pattern distribution for each user. In both models, a soft-max function is applied to integrate the personalized Markov chain with the latent patterns, and a sequential Bayesian Personalized Ranking (S-BPR) is applied as the optimization criterion. Then, Expectation Maximization (EM) is in charge of finding optimized model parameters. Extensive experiments on three large-scale commonly adopted real-world LBSN data sets prove that the inclusion of location category and latent patterns helps to boost the performance of POI recommendations. Specifically, our models in general significantly outperform other state-of-the-art methods for both next and next new POI recommendation tasks. Moreover, our models are capable of making accurate recommendations regardless of the short/long duration or distance.", acknowledgement = ack-nhfb, articleno = "46", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Du:2019:MED, author = "Xiaoyu Du and Xiangnan He and Fajie Yuan and Jinhui Tang and Zhiguang Qin and Tat-Seng Chua", title = "Modeling Embedding Dimension Correlations via Convolutional Neural Collaborative Filtering", journal = j-TOIS, volume = "37", number = "4", pages = "47:1--47:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3357154", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3357154", abstract = "As the core of recommender systems, collaborative filtering (CF) models the affinity between a user and an item from historical user-item interactions, such as clicks, purchases, and so on. Benefiting from the strong representation power, neural networks have recently revolutionized the recommendation research, setting up a new standard for CF. However, existing neural recommender models do not explicitly consider the correlations among embedding dimensions, making them less effective in modeling the interaction function between users and items. In this work, we emphasize on modeling the correlations among embedding dimensions in neural networks to pursue higher effectiveness for CF. We propose a novel and general neural collaborative filtering framework-namely, ConvNCF, which is featured with two designs: (1) applying outer product on user embedding and item embedding to explicitly model the pairwise correlations between embedding dimensions, and (2) employing convolutional neural network above the outer product to learn the high-order correlations among embedding dimensions. To justify our proposal, we present three instantiations of ConvNCF by using different inputs to represent a user and conduct experiments on two real-world datasets. Extensive results verify the utility of modeling embedding dimension correlations with ConvNCF, which outperforms several competitive CF methods.", acknowledgement = ack-nhfb, articleno = "47", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lin:2019:EPR, author = "Xiao Lin and Min Zhang and Yiqun Liu and Shaoping Ma", title = "Enhancing Personalized Recommendation by Implicit Preference Communities Modeling", journal = j-TOIS, volume = "37", number = "4", pages = "48:1--48:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3352592", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3352592", abstract = "Recommender systems aim to capture user preferences and provide accurate recommendations to users accordingly. For each user, there usually exist others with similar preferences, and a collection of users may also have similar preferences with each other, thus forming a community. However, such communities may not necessarily be explicitly given, and the users inside the same communities may not know each other; they are formally defined and named Implicit Preference Communities (IPCs) in this article. By enriching user preferences with the information of other users in the communities, the performance of recommender systems can also be enhanced. Historical explicit ratings are a good resource to construct the IPCs of users but is usually sparse. Meanwhile, user preferences are easily affected by their social connections, which can be jointly used for IPC modeling with the ratings. However, this imposes two challenges for model design. First, the rating and social domains are heterogeneous; thus, it is challenging to coordinate social information and rating behaviors for a same learning task. Therefore, transfer learning is a good strategy for IPC modeling. Second, the communities are not explicitly labeled, and existing supervised learning approaches do not fit the requirement of IPC modeling. As co-clustering is an effective unsupervised learning approach for discovering block structures in high-dimensional data, it is a cornerstone for discovering the structure of IPCs. In this article, we propose a recommendation model with Implicit Preference Communities from user ratings and social connections. To tackle the unsupervised learning limitation, we design a Bayesian probabilistic graphical model to capture the IPC structure for recommendation. Meanwhile, following the spirit of transfer learning, both rating behaviors and social connections are introduced into the model by parameter sharing. Moreover, Gibbs sampling-based algorithms are proposed for parameter inferences of the models. Furthermore, to meet the need for online scenarios when the data arrive sequentially as a stream, a novel online sampling-based parameter inference algorithm for recommendation is proposed. To the best of our knowledge, this is the first attempt to propose and formally define the concept of IPC.", acknowledgement = ack-nhfb, articleno = "48", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{deRijke:2019:RAT, author = "Maarten de Rijke", title = "Reviewers for {{\booktitle{ACM Transactions on Information Systems}}} Volume 37", journal = j-TOIS, volume = "37", number = "4", pages = "49:1--49:??", month = dec, year = "2019", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3365367", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3365367", acknowledgement = ack-nhfb, articleno = "49", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Han:2020:GDR, author = "Jungkyu Han and Hayato Yamana", title = "Geographic Diversification of Recommended {POIs} in Frequently Visited Areas", journal = j-TOIS, volume = "38", number = "1", pages = "1:1--1:??", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3362505", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3362505", abstract = "In the personalized Point-Of-Interest (POI) (or venue) recommendation, the diversity of recommended POIs is an important aspect. Diversity is especially important when POIs are recommended in the target users' frequently visited areas, because users are likely to revisit such areas. In addition to the (POI) category diversity that is a popular diversification objective in recommendation domains, diversification of recommended POI locations is an interesting subject itself. Despite its importance, existing POI recommender studies generally focus on and evaluate prediction accuracy. In this article, geographical diversification (geo-diversification), a novel diversification concept that aims to increase recommendation coverage for a target users' geographic areas of interest, is introduced, from which a method that improves geo-diversity as an addition to existing state-of-the-art POI recommenders is proposed. In experiments with the datasets from two real Location Based Social Networks (LSBNs), we first analyze the performance of four state-of-the-art POI recommenders from various evaluation perspectives including category diversity and geo-diversity that have not been examined previously. The proposed method consistently improves geo-diversity (CPR(geo)@20) by 5 to 12\% when combined with four state-of-the-art POI recommenders with negligible prediction accuracy (Recall@20) loss and provides 6 to 18\% geo-diversity improvement with tolerable prediction accuracy loss (up to 2.4\%).", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2020:UAC, author = "Xiaoying Zhang and Hong Xie and Junzhou Zhao and John C. S. Lui", title = "Understanding Assimilation-contrast Effects in Online Rating Systems: Modelling, Debiasing, and Applications", journal = j-TOIS, volume = "38", number = "1", pages = "2:1--2:??", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3362651", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3362651", abstract = "``Unbiasedness,'' which is an important property to ensure that users' ratings indeed reflect their true evaluations of products, is vital both in shaping consumer purchase decisions and providing reliable recommendations in online rating systems. Recent experimental studies showed that distortions from historical ratings would ruin the unbiasedness of subsequent ratings. How to ``discover'' historical distortions in each single rating (or at the micro-level), and perform the ``debiasing operations'' are our main objective. Using 42M real customer ratings, we first show that users either ``assimilate'' or ``contrast'' to historical ratings under different scenarios, which can be further explained by a well-known psychological argument: the ``Assimilate-Contrast'' theory. This motivates us to propose the Historical Influence Aware Latent Factor Model (HIALF), the ``first'' model for real rating systems to capture and mitigate historical distortions in each single rating. HIALF allows us to study the influence patterns of historical ratings from a modelling perspective, which perfectly matches the assimilation and contrast effects observed in experiments. Moreover, HIALF achieves significant improvements in predicting subsequent ratings and characterizing relationships in ratings. It also contributes to better recommendations, wiser consumer purchase decisions, and deeper understanding of historical distortions in both honest rating and misbehaving rating settings.", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Lv:2020:BAR, author = "Pengtao Lv and Xiangwu Meng and Yujie Zhang", title = "{BoRe}: Adapting to Reader Consumption Behavior Instability for News Recommendation", journal = j-TOIS, volume = "38", number = "1", pages = "3:1--3:??", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3361217", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3361217", abstract = "News recommendation has become an essential way to help readers discover interesting stories. While a growing line of research has focused on modeling reading preferences for news recommendation, they neglect the instability of reader consumption behaviors, i.e., consumption behaviors of readers may be influenced by other factors in addition to user interests, which degrades the recommendation effectiveness of existing methods. In this article, we propose a probabilistic generative model, BoRe, where user interests and crowd effects are used to adapt to the instability of reader consumption behaviors, and reading sequences are utilized to adapt user interests evolving over time. Further, the extreme sparsity problem in the domain of news severely hinders accurately modeling user interests and reading sequences, which discounts BoRe's ability to adapt to the instability. Accordingly, we leverage domain-specific features to model user interests in the situation of extreme sparsity. Meanwhile, we consider groups of users instead of individuals to capture reading sequences. Besides, we study how to reduce the computation to allow online application. Extensive experiments have been conducted to evaluate the effectiveness and efficiency of BoRe on real-world datasets. The experimental results show the superiority of BoRe, compared with the state-of-the-art competing methods.", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Ai:2020:EPS, author = "Qingyao Ai and Yongfeng Zhang and Keping Bi and W. Bruce Croft", title = "Explainable Product Search with a Dynamic Relation Embedding Model", journal = j-TOIS, volume = "38", number = "1", pages = "4:1--4:??", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3361738", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/ft_gateway.cfm?id=3361738", abstract = "Product search is one of the most popular methods for customers to discover products online. Most existing studies on product search focus on developing effective retrieval models that rank items by their likelihood to be purchased. However, they ignore the problem that there is a gap between how systems and customers perceive the relevance of items. Without explanations, users may not understand why product search engines retrieve certain items for them, which consequentially leads to imperfect user experience and suboptimal system performance in practice. In this work, we tackle this problem by constructing explainable retrieval models for product search. Specifically, we propose to model the ``search and purchase'' behavior as a dynamic relation between users and items, and create a dynamic knowledge graph based on both the multi-relational product data and the context of the search session. Ranking is conducted based on the relationship between users and items in the latent space, and explanations are generated with logic inferences and entity soft matching on the knowledge graph. Empirical experiments show that our model, which we refer to as the Dynamic Relation Embedding Model (DREM), significantly outperforms the state-of-the-art baselines and has the ability to produce reasonable explanations for search results.", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Zhang:2020:MLC, author = "Dong Zhang and Shu Zhao and Zhen Duan and Jie Chen and Yanping Zhang and Jie Tang", title = "A Multi-Label Classification Method Using a Hierarchical and Transparent Representation for Paper-Reviewer Recommendation", journal = j-TOIS, volume = "38", number = "1", pages = "5:1--5:20", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3361719", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:56:24 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3361719", abstract = "The paper-reviewer recommendation task is of significant academic importance for conference chairs and journal editors. It aims to recommend appropriate experts in a discipline to comment on the quality of papers of others in that discipline. How to \ldots{}", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ahmad:2020:DLA, author = "Faizan Ahmad and Ahmed Abbasi and Jingjing Li and David G. Dobolyi and Richard G. Netemeyer and Gari D. Clifford and Hsinchun Chen", title = "A Deep Learning Architecture for Psychometric Natural Language Processing", journal = j-TOIS, volume = "38", number = "1", pages = "6:1--6:29", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3365211", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:56:24 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3365211", abstract = "Psychometric measures reflecting people's knowledge, ability, attitudes, and personality traits are critical for many real-world applications, such as e-commerce, health care, and cybersecurity. However, traditional methods cannot collect and measure \ldots{}", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zeng:2020:NIR, author = "Zijie Zeng and Jing Lin and Lin Li and Weike Pan and Zhong Ming", title = "Next-Item Recommendation via Collaborative Filtering with Bidirectional Item Similarity", journal = j-TOIS, volume = "38", number = "1", pages = "7:1--7:22", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3366172", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:56:24 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3366172", abstract = "Exploiting temporal effect has empirically been recognized as a promising way to improve recommendation performance in recent years. In real-world applications, one-class data in the form of (user, item, timestamp) are usually more accessible and \ldots{}", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2020:ECG, author = "Xiao Sun and Jia Li and Xing Wei and Changliang Li and Jianhua Tao", title = "Emotional Conversation Generation Based on a {Bayesian} Deep Neural Network", journal = j-TOIS, volume = "38", number = "1", pages = "8:1--8:24", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3368960", ISSN = "1046-8188", bibdate = "Wed Dec 11 07:07:43 MST 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The field of conversation generation using neural networks has attracted increasing attention from researchers for several years. However, traditional neural language models tend to generate a generic reply with poor semantic logic and no emotion. This article proposes an emotional conversation generation model based on a Bayesian deep neural network that can generate replies with rich emotions, clear themes, and diverse sentences. The topic and emotional keywords of the replies are pregenerated by introducing commonsense knowledge in the model. The reply is divided into multiple clauses, and then a multidimensional generator based on the transformer mechanism proposed in this article is used to iteratively generate clauses from two dimensions: sentence granularity and sentence structure. Subjective and objective experiments prove that compared with existing models, the proposed model effectively improves the semantic logic and emotional accuracy of replies. This model also significantly enhances the diversity of replies, largely overcoming the shortcomings of traditional models that generate safe replies.", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "http://portal.acm.org/browse_dl.cfm?idx=J779", } @Article{Choi:2020:ETC, author = "Bogeum Choi and Austin Ward and Yuan Li and Jaime Arguello and Robert Capra", title = "The Effects of Task Complexity on the Use of Different Types of Information in a Search Assistance Tool", journal = j-TOIS, volume = "38", number = "1", pages = "9:1--9:28", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3371707", ISSN = "1046-8188", bibdate = "Mon Feb 10 12:32:39 MST 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3371707", abstract = "In interactive information retrieval, an important research question is: How do task characteristics influence users' needs and behaviors? We report on a laboratory study $(N = 32)$ that investigated the effects of task complexity on the types of \ldots{}", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Thomas:2020:ISM, author = "Paul Thomas and Bodo Billerbeck and Nick Craswell and Ryen W. White", title = "Investigating Searchers' Mental Models to Inform Search Explanations", journal = j-TOIS, volume = "38", number = "1", pages = "10:1--10:25", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3371390", ISSN = "1046-8188", bibdate = "Mon Feb 10 12:32:39 MST 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3371390", abstract = "Modern web search engines use many signals to select and rank results in response to queries. However, searchers' mental models of search are relatively unsophisticated, hindering their ability to use search engines efficiently and effectively. \ldots{}", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ding:2020:IIR, author = "Jingtao Ding and Guanghui Yu and Yong Li and Xiangnan He and Depeng Jin", title = "Improving Implicit Recommender Systems with Auxiliary Data", journal = j-TOIS, volume = "38", number = "1", pages = "11:1--11:27", month = feb, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3372338", ISSN = "1046-8188", bibdate = "Mon Feb 10 12:32:39 MST 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3372338", abstract = "Most existing recommender systems leverage the primary feedback only, despite the fact that users also generate a large amount of auxiliary feedback. These feedback usually indicate different user preferences when comparing to the primary feedback \ldots{}", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2020:LVF, author = "Yifan Chen and Yang Wang and Xiang Zhao and Hongzhi Yin and Ilya Markov and Maarten De Rijke", title = "Local Variational Feature-Based Similarity Models for Recommending Top-{$N$} New Items", journal = j-TOIS, volume = "38", number = "2", pages = "12:1--12:33", month = mar, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3372154", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:51:00 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3372154", abstract = "The top-$N$ recommendation problem has been studied extensively. Item-based collaborative filtering recommendation algorithms show promising results for the problem. They predict a user's preferences by estimating similarities between a target and user-\ldots{}", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Arapakis:2020:PPA, author = "Ioannis Arapakis and Antonio Penta and Hideo Joho and Luis A. Leiva", title = "A Price-per-attention Auction Scheme Using Mouse Cursor Information", journal = j-TOIS, volume = "38", number = "2", pages = "13:1--13:30", month = jan, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3374210", ISSN = "1046-8188", bibdate = "Mon Feb 10 12:32:40 MST 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3374210", abstract = "Payments in online ad auctions are typically derived from click-through rates, so that advertisers do not pay for ineffective ads. But advertisers often care about more than just clicks. That is, for example, if they aim to raise brand awareness or \ldots{}", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2020:ENM, author = "Chong Chen and Min Zhang and Yongfeng Zhang and Yiqun Liu and Shaoping Ma", title = "Efficient Neural Matrix Factorization without Sampling for Recommendation", journal = j-TOIS, volume = "38", number = "2", pages = "14:1--14:28", month = jan, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3373807", ISSN = "1046-8188", bibdate = "Mon Feb 10 12:32:40 MST 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3373807", abstract = "Recommendation systems play a vital role to keep users engaged with personalized contents in modern online platforms. Recently, deep learning has revolutionized many research fields and there is a surge of interest in applying it for recommendation. \ldots{}", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2020:ENN, author = "Chuan Qin and Hengshu Zhu and Tong Xu and Chen Zhu and Chao Ma and Enhong Chen and Hui Xiong", title = "An Enhanced Neural Network Approach to Person-Job Fit in Talent Recruitment", journal = j-TOIS, volume = "38", number = "2", pages = "15:1--15:33", month = mar, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3376927", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:51:00 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3376927", abstract = "The widespread use of online recruitment services has led to an information explosion in the job market. As a result, recruiters have to seek intelligent ways for Person-Job Fit, which is the bridge for adapting the right candidates to the right \ldots{}", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Meng:2020:JLR, author = "Zaiqiao Meng and Shangsong Liang and Xiangliang Zhang and Richard McCreadie and Iadh Ounis", title = "Jointly Learning Representations of Nodes and Attributes for Attributed Networks", journal = j-TOIS, volume = "38", number = "2", pages = "16:1--16:32", month = jan, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3377850", ISSN = "1046-8188", bibdate = "Mon Feb 10 12:32:40 MST 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3377850", abstract = "Previous embedding methods for attributed networks aim at learning low-dimensional vector representations only for nodes but not for both nodes and attributes, resulting in the fact that node embeddings cannot be directly used to recover the \ldots{}", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2020:LSR, author = "Wayne Xin Zhao and Yupeng Hou and Junhua Chen and Jonathan J. H. Zhu and Eddy Jing Yin and Hanting Su and Ji-Rong Wen", title = "Learning Semantic Representations from Directed Social Links to Tag Microblog Users at Scale", journal = j-TOIS, volume = "38", number = "2", pages = "17:1--17:30", month = mar, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3377550", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:51:00 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3377550", abstract = "This article presents a network embedding approach to automatically generate tags for microblog users. Instead of using text data, we aim to annotate microblog users with meaningful tags by leveraging rich social link data. To utilize directed social \ldots{}", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Naskar:2020:EDP, author = "Debashis Naskar and Sanasam Ranbir Singh and Durgesh Kumar and Sukumar Nandi and Eva Onaindia de la Rivaherrera", title = "Emotion Dynamics of Public Opinions on {Twitter}", journal = j-TOIS, volume = "38", number = "2", pages = "18:1--18:24", month = mar, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3379340", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:51:00 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3379340", abstract = "Recently, social media has been considered the fastest medium for information broadcasting and sharing. Considering the wide range of applications such as viral marketing, political campaigns, social advertisement, and so on, influencing characteristics \ldots{}", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2020:LFD, author = "Zhenya Huang and Qi Liu and Yuying Chen and Le Wu and Keli Xiao and Enhong Chen and Haiping Ma and Guoping Hu", title = "Learning or Forgetting? {A} Dynamic Approach for Tracking the Knowledge Proficiency of Students", journal = j-TOIS, volume = "38", number = "2", pages = "19:1--19:33", month = mar, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3379507", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:51:00 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3379507", abstract = "The rapid development of the technologies for online learning provides students with extensive resources for self-learning and brings new opportunities for data-driven research on educational management. An important issue of online learning is to \ldots{}", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Nie:2020:LSQ, author = "Liqiang Nie and Yongqi Li and Fuli Feng and Xuemeng Song and Meng Wang and Yinglong Wang", title = "Large-Scale Question Tagging via Joint Question-Topic Embedding Learning", journal = j-TOIS, volume = "38", number = "2", pages = "20:1--20:23", month = mar, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3380954", ISSN = "1046-8188", bibdate = "Thu Mar 19 10:51:00 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3380954", abstract = "Recent years have witnessed a flourishing of community-driven question answering (cQA), like Yahoo! Answers and AnswerBag, where people can seek precise information. After 2010, some novel cQA systems, including Quora and Zhihu, gained momentum. Besides \ldots{}", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2020:CBI, author = "Minlie Huang and Xiaoyan Zhu and Jianfeng Gao", title = "Challenges in Building Intelligent Open-domain Dialog Systems", journal = j-TOIS, volume = "38", number = "3", pages = "21:1--21:32", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3383123", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3383123", abstract = "There is a resurgent interest in developing intelligent open-domain dialog systems due to the availability of large amounts of conversational data and the recent progress on neural approaches to conversational AI [33]. Unlike traditional task-oriented \ldots{}", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qiu:2020:ECS, author = "Ruihong Qiu and Zi Huang and Jingjing Li and Hongzhi Yin", title = "Exploiting Cross-session Information for Session-based Recommendation with Graph Neural Networks", journal = j-TOIS, volume = "38", number = "3", pages = "22:1--22:23", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3382764", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3382764", abstract = "Different from the traditional recommender system, the session-based recommender system introduces the concept of the session, i.e., a sequence of interactions between a user and multiple items within a period, to preserve the user's recent interest. \ldots{}", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{deOliveira:2020:OSA, author = "Wyverson Bonasoli de Oliveira and Leyza Baldo Dorini and Rodrigo Minetto and Thiago H. Silva", title = "{OutdoorSent}: Sentiment Analysis of Urban Outdoor Images by Using Semantic and Deep Features", journal = j-TOIS, volume = "38", number = "3", pages = "23:1--23:28", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3385186", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3385186", abstract = "Opinion mining in outdoor images posted by users during different activities can provide valuable information to better understand urban areas. In this regard, we propose a framework to classify the sentiment of outdoor images shared by users on social \ldots{}", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jagerman:2020:SEO, author = "Rolf Jagerman and Ilya Markov and Maarten {De Rijke}", title = "Safe Exploration for Optimizing Contextual Bandits", journal = j-TOIS, volume = "38", number = "3", pages = "24:1--24:23", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3385670", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3385670", abstract = "Contextual bandit problems are a natural fit for many information retrieval tasks, such as learning to rank, text classification, recommendation, and so on. However, existing learning methods for contextual bandit problems have one of two drawbacks: \ldots{}", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2020:FDN, author = "Yang Liu and Yi-Fang Brook Wu", title = "{FNED}: a Deep Network for Fake News Early Detection on Social Media", journal = j-TOIS, volume = "38", number = "3", pages = "25:1--25:33", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3386253", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3386253", abstract = "The fast spreading of fake news stories on social media can cause inestimable social harm. Developing effective methods to detect them early is of paramount importance. A major challenge of fake news early detection is fully utilizing the limited data \ldots{}", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Alserafi:2020:KDL, author = "Ayman Alserafi and Alberto Abell{\'o} and Oscar Romero and Toon Calders", title = "Keeping the Data Lake in Form: Proximity Mining for Pre-Filtering Schema Matching", journal = j-TOIS, volume = "38", number = "3", pages = "26:1--26:30", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3388870", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3388870", abstract = "Data lakes (DLs) are large repositories of raw datasets from disparate sources. As more datasets are ingested into a DL, there is an increasing need for efficient techniques to profile them and to detect the relationships among their schemata, commonly \ldots{}", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zou:2020:TQB, author = "Jie Zou and Evangelos Kanoulas", title = "Towards Question-based High-recall Information Retrieval: Locating the Last Few Relevant Documents for Technology-assisted Reviews", journal = j-TOIS, volume = "38", number = "3", pages = "27:1--27:35", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3388640", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3388640", abstract = "While continuous active learning algorithms have proven effective in finding most of the relevant documents in a collection, the cost for locating the last few remains high for applications such as Technology-assisted Reviews (TAR). To locate these last \ldots{}", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2020:NHN, author = "Jie Huang and Chuan Chen and Fanghua Ye and Weibo Hu and Zibin Zheng", title = "Nonuniform Hyper-Network Embedding with Dual Mechanism", journal = j-TOIS, volume = "38", number = "3", pages = "28:1--28:18", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3388924", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3388924", abstract = "Network embedding which aims to learn the low-dimensional representations for vertices in networks has been extensively studied in recent years. Although there are various models designed for networks with different properties and different structures \ldots{}", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tonellotto:2020:UII, author = "Nicola Tonellotto and Craig Macdonald", title = "Using an Inverted Index Synopsis for Query Latency and Performance Prediction", journal = j-TOIS, volume = "38", number = "3", pages = "29:1--29:33", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3389795", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3389795", abstract = "Predicting the query latency by a search engine has important benefits, for instance, in allowing the search engine to adjust its configuration to address long-running queries without unnecessarily sacrificing its effectiveness. However, for the dynamic \ldots{}", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cheng:2020:RUC, author = "Miaomiao Cheng and Liping Jing and Michael K. Ng", title = "Robust Unsupervised Cross-modal Hashing for Multimedia Retrieval", journal = j-TOIS, volume = "38", number = "3", pages = "30:1--30:25", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3389547", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/hash.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3389547", abstract = "With the quick development of social websites, there are more opportunities to have different media types (such as text, image, video, etc.) describing the same topic from large-scale heterogeneous data sources. To efficiently identify the inter-media correlations for multimedia retrieval, unsupervised cross-modal hashing (UCMH) has gained increased interest due to the significant reduction in computation and storage. However, most UCMH methods assume that the data from different modalities are well paired. As a result, existing UCMH methods may not achieve satisfactory performance when partially paired data are given only. In this article, we propose a new-type of UCMH method called robust unsupervised cross-modal hashing (RUCMH). The major contribution lies in jointly learning modal-specific hash function, exploring the correlations among modalities with partial or even without any pairwise correspondence, and preserving the information of original features as much as possible. The learning process can be modeled via a joint minimization problem, and the corresponding optimization algorithm is presented. A series of experiments is conducted on four real-world datasets (Wiki, MIRFlickr, NUS-WIDE, and MS-COCO). The results demonstrate that RUCMH can significantly outperform the state-of-the-art unsupervised cross-modal hashing methods, especially for the partially paired case, which validates the effectiveness of RUCMH.", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2020:DFG, author = "Ruqing Zhang and Jiafeng Guo and Yixing Fan and Yanyan Lan and Xueqi Cheng", title = "Dual-factor Generation Model for Conversation", journal = j-TOIS, volume = "38", number = "3", pages = "31:1--31:31", month = jun, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3394052", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jun 27 14:50:14 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/abs/10.1145/3394052", abstract = "The conversation task is usually formulated as a conditional generation problem, i.e., to generate a natural and meaningful response given the input utterance. Generally speaking, this formulation is apparently based on an oversimplified assumption that \ldots{}", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2020:EEB, author = "Hao Lin and Hengshu Zhu and Junjie Wu and Yuan Zuo and Chen Zhu and Hui Xiong", title = "Enhancing Employer Brand Evaluation with Collaborative Topic Regression Models", journal = j-TOIS, volume = "38", number = "4", pages = "32:1--32:33", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3392734", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3392734", abstract = "Employer Brand Evaluation (EBE) is to understand an employer's unique characteristics to identify competitive edges. Traditional approaches rely heavily on employers' financial information, including financial reports and filings submitted to the \ldots{}", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Moffat:2020:LAS, author = "Alistair Moffat and Matthias Petri", title = "Large-Alphabet Semi-Static Entropy Coding Via Asymmetric Numeral Systems", journal = j-TOIS, volume = "38", number = "4", pages = "33:1--33:33", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3397175", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3397175", abstract = "An entropy coder takes as input a sequence of symbol identifiers over some specified alphabet and represents that sequence as a bitstring using as few bits as possible, typically assuming that the elements of the sequence are independent of each other. \ldots{}", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ren:2020:CCR, author = "Xuhui Ren and Hongzhi Yin and Tong Chen and Hao Wang and Nguyen Quoc Viet Hung and Zi Huang and Xiangliang Zhang", title = "{CRSAL}: Conversational Recommender Systems with Adversarial Learning", journal = j-TOIS, volume = "38", number = "4", pages = "34:1--34:40", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3394592", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3394592", abstract = "Recommender systems have been attracting much attention from both academia and industry because of their ability to capture user interests and generate personalized item recommendations. As the life pace in contemporary society speeds up, traditional \ldots{}", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2020:SHO, author = "Xiancong Chen and Lin Li and Weike Pan and Zhong Ming", title = "A Survey on Heterogeneous One-class Collaborative Filtering", journal = j-TOIS, volume = "38", number = "4", pages = "35:1--35:54", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3402521", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3402521", abstract = "Recommender systems play an important role in providing personalized services for users in the context of information overload. Generally, users' feedback toward items often contain the most significant information reflecting their preferences, which \ldots{}", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2020:PLP, author = "Richong Zhang and Samuel Mensah and Fanshuang Kong and Zhiyuan Hu and Yongyi Mao and Xudong Liu", title = "Pairwise Link Prediction Model for Out of Vocabulary Knowledge Base Entities", journal = j-TOIS, volume = "38", number = "4", pages = "36:1--36:28", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3406116", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3406116", abstract = "Real-world knowledge bases such as DBPedia, Yago, and Freebase contain sparse linkage connectivity, which poses a severe challenge to link prediction between entities. To cope with such data scarcity issues, recent models have focused on learning \ldots{}", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2020:FGP, author = "Xiaolin Chen and Xuemeng Song and Ruiyang Ren and Lei Zhu and Zhiyong Cheng and Liqiang Nie", title = "Fine-Grained Privacy Detection with Graph-Regularized Hierarchical Attentive Representation Learning", journal = j-TOIS, volume = "38", number = "4", pages = "37:1--37:26", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3406109", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3406109", abstract = "Due to the complex and dynamic environment of social media, user generated contents (UGCs) may inadvertently leak users' personal aspects, such as the personal attributes, relationships and even the health condition, and thus place users at high privacy \ldots{}", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Agosti:2020:LUK, author = "Maristella Agosti and Stefano Marchesin and Gianmaria Silvello", title = "Learning Unsupervised Knowledge-Enhanced Representations to Reduce the Semantic Gap in Information Retrieval", journal = j-TOIS, volume = "38", number = "4", pages = "38:1--38:48", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3417996", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3417996", abstract = "The semantic mismatch between query and document terms-i.e., the semantic gap-is a long-standing problem in Information Retrieval (IR). Two main linguistic features related to the semantic gap that can be exploited to improve retrieval are synonymy and \ldots{}", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Kim:2020:ETM, author = "Youngwoo Kim and Myungha Jang and James Allan", title = "Explaining Text Matching on Neural Natural Language Inference", journal = j-TOIS, volume = "38", number = "4", pages = "39:1--39:23", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3418052", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3418052", abstract = "Natural language inference (NLI) is the task of detecting the existence of entailment or contradiction in a given sentence pair. Although NLI techniques could help numerous information retrieval tasks, most solutions for NLI are neural approaches whose \ldots{}", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2020:MME, author = "Chang Li and Ilya Markov and Maarten {De Rijke} and Masrour Zoghi", title = "{MergeDTS}: a Method for Effective Large-Scale Online Ranker Evaluation", journal = j-TOIS, volume = "38", number = "4", pages = "40:1--40:28", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3411753", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3411753", abstract = "Online ranker evaluation is one of the key challenges in information retrieval. Although the preferences of rankers can be inferred by interleaving methods, the problem of how to effectively choose the ranker pair that generates the interleaved list \ldots{}", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2020:WSR, author = "Dan Li and Evangelos Kanoulas", title = "When to Stop Reviewing in Technology-Assisted Reviews: Sampling from an Adaptive Distribution to Estimate Residual Relevant Documents", journal = j-TOIS, volume = "38", number = "4", pages = "41:1--41:36", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3411755", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3411755", abstract = "Technology-Assisted Reviews (TAR) aim to expedite document reviewing (e.g., medical articles or legal documents) by iteratively incorporating machine learning algorithms and human feedback on document relevance. Continuous Active Learning (CAL) \ldots{}", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2020:BAI, author = "Yifan Chen and Yang Wang and Xiang Zhao and Jie Zou and Maarten {De Rijke}", title = "Block-Aware Item Similarity Models for Top-{$N$} Recommendation", journal = j-TOIS, volume = "38", number = "4", pages = "42:1--42:26", month = oct, year = "2020", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3411754", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 14 06:47:18 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3411754", abstract = "Top- N recommendations have been studied extensively. Promising results have been achieved by recent item-based collaborative filtering (ICF) methods. The key to ICF lies in the estimation of item similarities. Observing the block-diagonal structure of \ldots{}", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2021:PES, author = "Guangzhen Zhao and Peng Yang", title = "Pretrained Embeddings for Stance Detection with Hierarchical Capsule Network on Social Media", journal = j-TOIS, volume = "39", number = "1", pages = "1:1--1:32", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3412362", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3412362", abstract = "Stance detection on social media aims to identify the stance of social media users toward a topic or claim, which can provide powerful information for various downstream tasks. Many existing stance detection approaches neglect to model the deep semantic \ldots{}", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2021:GBR, author = "Yuan Zhang and Fei Sun and Xiaoyong Yang and Chen Xu and Wenwu Ou and Yan Zhang", title = "Graph-based Regularization on Embedding Layers for Recommendation", journal = j-TOIS, volume = "39", number = "1", pages = "2:1--2:27", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3414067", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3414067", abstract = "Neural networks have been extensively used in recommender systems. Embedding layers are not only necessary but also crucial for neural models in recommendation as a typical discrete task. In this article, we argue that the widely used $l_2$ regularization \ldots{}", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mousset:2021:EEN, author = "Paul Mousset and Yoann Pitarch and Lynda Tamine", title = "End-to-End Neural Matching for Semantic Location Prediction of Tweets", journal = j-TOIS, volume = "39", number = "1", pages = "3:1--3:35", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3415149", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3415149", abstract = "The impressive increasing availability of social media posts has given rise to considerable research challenges. This article is concerned with the problem of semantic location prediction of geotagged tweets. The underlying task is to associate to a \ldots{}", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mcdonald:2021:HAC, author = "Graham Mcdonald and Craig Macdonald and Iadh Ounis", title = "How the Accuracy and Confidence of Sensitivity Classification Affects Digital Sensitivity Review", journal = j-TOIS, volume = "39", number = "1", pages = "4:1--4:34", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3417334", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3417334", abstract = "Government documents must be manually reviewed to identify any sensitive information, e.g., confidential information, before being publicly archived. However, human-only sensitivity review is not practical for born-digital documents due to, for example, \ldots{}", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mendoza:2021:BSI, author = "Marcelo Mendoza and Maurizio Tesconi and Stefano Cresci", title = "Bots in Social and Interaction Networks: Detection and Impact Estimation", journal = j-TOIS, volume = "39", number = "1", pages = "5:1--5:32", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3419369", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3419369", abstract = "The rise of bots and their influence on social networks is a hot topic that has aroused the interest of many researchers. Despite the efforts to detect social bots, it is still difficult to distinguish them from legitimate users. Here, we propose a \ldots{}", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2021:ABD, author = "Bulou Liu and Chenliang Li and Wei Zhou and Feng Ji and Yu Duan and Haiqing Chen", title = "An Attention-based Deep Relevance Model for Few-shot Document Filtering", journal = j-TOIS, volume = "39", number = "1", pages = "6:1--6:35", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3419972", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3419972", abstract = "With the large quantity of textual information produced on the Internet, a critical necessity is to filter out the irrelevant information and organize the rest into categories of interest (e.g., an emerging event). However, supervised-learning document \ldots{}", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lan:2021:PNA, author = "Tian Lan and Xian-Ling Mao and Wei Wei and Xiaoyan Gao and Heyan Huang", title = "{PONE}: a Novel Automatic Evaluation Metric for Open-domain Generative Dialogue Systems", journal = j-TOIS, volume = "39", number = "1", pages = "7:1--7:37", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3423168", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3423168", abstract = "Open-domain generative dialogue systems have attracted considerable attention over the past few years. Currently, how to automatically evaluate them is still a big challenge. As far as we know, there are three kinds of automatic evaluations for open-\ldots{}", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2021:NFA, author = "Xu Chen and Kun Xiong and Yongfeng Zhang and Long Xia and Dawei Yin and Jimmy Xiangji Huang", title = "Neural Feature-aware Recommendation with Signed Hypergraph Convolutional Network", journal = j-TOIS, volume = "39", number = "1", pages = "8:1--8:22", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3423322", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3423322", abstract = "Understanding user preference is of key importance for an effective recommender system. For comprehensive user profiling, many efforts have been devoted to extract user feature-level preference from the review information. Despite effectiveness, \ldots{}", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Manioudakis:2021:FSO, author = "Kostas Manioudakis and Yannis Tzitzikas", title = "Faceted Search with Object Ranking and Answer Size Constraints", journal = j-TOIS, volume = "39", number = "1", pages = "9:1--9:33", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3425603", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3425603", abstract = "Faceted Search is a widely used interaction scheme in digital libraries, e-commerce, and recently also in Linked Data. Surprisingly, object ranking in the context of Faceted Search is not well studied in the literature. In this article, we propose an \ldots{}", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fang:2021:DLS, author = "Hui Fang and Danning Zhang and Yiheng Shu and Guibing Guo", title = "Deep Learning for Sequential Recommendation: Algorithms, Influential Factors, and Evaluations", journal = j-TOIS, volume = "39", number = "1", pages = "10:1--10:42", month = jan, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3426723", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sun Mar 28 09:55:32 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3426723", abstract = "In the field of sequential recommendation, deep learning--(DL) based methods have received a lot of attention in the past few years and surpassed traditional models such as Markov chain-based and factorization-based ones. However, there is little \ldots{}", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Muntean:2021:WPE, author = "Cristina Ioana Muntean and Franco Maria Nardini and Raffaele Perego and Nicola Tonellotto and Ophir Frieder", title = "Weighting Passages Enhances Accuracy", journal = j-TOIS, volume = "39", number = "2", pages = "11:1--11:11", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3428687", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3428687", abstract = "We observe that in curated documents the distribution of the occurrences of salient terms, e.g., terms with a high Inverse Document Frequency, is not uniform, and such terms are primarily concentrated towards the beginning and the end of the document. \ldots{}", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gao:2021:LRY, author = "Shen Gao and Xiuying Chen and Li Liu and Dongyan Zhao and Rui Yan", title = "Learning to Respond with Your Favorite Stickers: a Framework of Unifying Multi-Modality and User Preference in Multi-Turn Dialog", journal = j-TOIS, volume = "39", number = "2", pages = "12:1--12:32", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3429980", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3429980", abstract = "Stickers with vivid and engaging expressions are becoming increasingly popular in online messaging apps, and some works are dedicated to automatically select sticker response by matching the stickers image with previous utterances. However, existing \ldots{}", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Adomavicius:2021:EPA, author = "Gediminas Adomavicius and Jesse Bockstedt and Shawn Curley and Jingjing Zhang", title = "Effects of Personalized and Aggregate Top-{$N$} Recommendation Lists on User Preference Ratings", journal = j-TOIS, volume = "39", number = "2", pages = "13:1--13:38", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3430028", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3430028", abstract = "Prior research has shown a robust effect of personalized product recommendations on user preference judgments for items. Specifically, the display of system-predicted preference ratings as item recommendations has been shown in multiple studies to bias \ldots{}", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sakai:2021:REM, author = "Tetsuya Sakai and Zhaohao Zeng", title = "Retrieval Evaluation Measures that Agree with Users' {SERP} Preferences: Traditional, Preference-based, and Diversity Measures", journal = j-TOIS, volume = "39", number = "2", pages = "14:1--14:35", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3431813", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3431813", abstract = "We examine the ``goodness'' of ranked retrieval evaluation measures in terms of how well they align with users' Search Engine Result Page (SERP) preferences for web search. The SERP preferences cover 1,127 topic-SERP-SERP triplets extracted from the NTCIR-. \ldots{}", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2021:MRA, author = "Peng Liu and Lemei Zhang and Jon Atle Gulla", title = "Multilingual Review-aware Deep Recommender System via Aspect-based Sentiment Analysis", journal = j-TOIS, volume = "39", number = "2", pages = "15:1--15:33", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3432049", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3432049", abstract = "With the dramatic expansion of international markets, consumers write reviews in different languages, which poses a new challenge for Recommender Systems (RSs) dealing with this increasing amount of multilingual information. Recent studies that leverage \ldots{}", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2021:TDU, author = "Chenyang Wang and Weizhi Ma and Min Zhang and Chong Chen and Yiqun Liu and Shaoping Ma", title = "Toward Dynamic User Intention: Temporal Evolutionary Effects of Item Relations in Sequential Recommendation", journal = j-TOIS, volume = "39", number = "2", pages = "16:1--16:33", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3432244", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3432244", abstract = "User intention is an important factor to be considered for recommender systems, which always changes dynamically in different contexts. Recent studies (represented by sequential recommendation) begin to focus on predicting what users want beyond what \ldots{}", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{White:2021:MD, author = "Ryen W. White and Elnaz Nouri and James Woffinden-Luey and Mark Encarnaci{\'o}N and Sujay Kumar Jauhar", title = "Microtask Detection", journal = j-TOIS, volume = "39", number = "2", pages = "17:1--17:29", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3432290", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3432290", abstract = "Information systems, such as task management applications and digital assistants, can help people keep track of tasks of different types and different time durations, ranging from a few minutes to days or weeks. Helping people better manage their tasks \ldots{}", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gao:2021:MAG, author = "Shen Gao and Xiuying Chen and Zhaochun Ren and Dongyan Zhao and Rui Yan", title = "Meaningful Answer Generation of E-Commerce Question-Answering", journal = j-TOIS, volume = "39", number = "2", pages = "18:1--18:26", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3432689", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3432689", abstract = "In e-commerce portals, generating answers for product-related questions has become a crucial task. In this article, we focus on the task of product-aware answer generation, which learns to generate an accurate and complete answer from large-scale \ldots{}", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Esuli:2021:CRS, author = "Andrea Esuli and Alessio Molinari and Fabrizio Sebastiani", title = "A Critical Reassessment of the {Saerens--Latinne--Decaestecker} Algorithm for Posterior Probability Adjustment", journal = j-TOIS, volume = "39", number = "2", pages = "19:1--19:34", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3433164", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3433164", abstract = "We critically re-examine the Saerens-Latinne-Decaestecker (SLD) algorithm, a well-known method for estimating class prior probabilities (``priors'') and adjusting posterior probabilities (``posteriors'') in scenarios characterized by distribution shift, \ldots{}", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dacrema:2021:TAR, author = "Maurizio Ferrari Dacrema and Simone Boglio and Paolo Cremonesi and Dietmar Jannach", title = "A Troubling Analysis of Reproducibility and Progress in Recommender Systems Research", journal = j-TOIS, volume = "39", number = "2", pages = "20:1--20:49", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3434185", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3434185", abstract = "The design of algorithms that generate personalized ranked item lists is a central topic of research in the field of recommender systems. In the past few years, in particular, approaches based on deep learning (neural) techniques have become dominant in \ldots{}", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ai:2021:ULR, author = "Qingyao Ai and Tao Yang and Huazheng Wang and Jiaxin Mao", title = "Unbiased Learning to Rank: Online or Offline?", journal = j-TOIS, volume = "39", number = "2", pages = "21:1--21:29", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3439861", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3439861", abstract = "How to obtain an unbiased ranking model by learning to rank with biased user feedback is an important research question for IR. Existing work on unbiased learning to rank (ULTR) can be broadly categorized into two groups-the studies on unbiased learning \ldots{}", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2021:VNV, author = "Wei Wang and Longbing Cao", title = "{VM-NSP}: Vertical Negative Sequential Pattern Mining with Loose Negative Element Constraints", journal = j-TOIS, volume = "39", number = "2", pages = "22:1--22:27", month = mar, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3440874", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Apr 1 09:57:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3440874", abstract = "Negative sequential patterns (NSPs) capture more informative and actionable knowledge than classic positive sequential patterns (PSPs) due to the involvement of both occurring and nonoccurring behaviors and events, which can contribute to many relevant \ldots{}", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2021:EMN, author = "Min Zhang", title = "Editorial Message from the New {Editor-in-Chief}", journal = j-TOIS, volume = "39", number = "3", pages = "23e:1--23e:2", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3447945", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3447945", acknowledgement = ack-nhfb, articleno = "23e", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2021:MMC, author = "Yanan Xu and Yanmin Zhu and Jiadi Yu", title = "Modeling Multiple Coexisting Category-Level Intentions for Next Item Recommendation", journal = j-TOIS, volume = "39", number = "3", pages = "23:1--23:24", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3441642", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3441642", abstract = "Purchase intentions have a great impact on future purchases and thus can be exploited for making recommendations. However, purchase intentions are typically complex and may change from time to time. Through empirical study with two e-commerce datasets, we \ldots{}", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2021:ISB, author = "Wei Wang and Longbing Cao", title = "Interactive Sequential Basket Recommendation by Learning Basket Couplings and Positive\slash Negative Feedback", journal = j-TOIS, volume = "39", number = "3", pages = "24:1--24:26", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3444368", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3444368", abstract = "Sequential recommendation, such as next-basket recommender systems (NBRS), which model users' sequential behaviors and the relevant context/session, has recently attracted much attention from the research community. Existing session-based NBRS involve \ldots{}", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2021:TCU, author = "Hongtao Liu and Wenjun Wang and Qiyao Peng and Nannan Wu and Fangzhao Wu and Pengfei Jiao", title = "Toward Comprehensive User and Item Representations via Three-tier Attention Network", journal = j-TOIS, volume = "39", number = "3", pages = "25:1--25:22", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3446341", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3446341", abstract = "Product reviews can provide rich information about the opinions users have of products. However, it is nontrivial to effectively infer user preference and item characteristics from reviews due to the complicated semantic understanding. Existing methods \ldots{}", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zeng:2021:RLB, author = "Weixin Zeng and Xiang Zhao and Jiuyang Tang and Xuemin Lin and Paul Groth", title = "Reinforcement Learning-based Collective Entity Alignment with Adaptive Features", journal = j-TOIS, volume = "39", number = "3", pages = "26:1--26:31", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3446428", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3446428", abstract = "Entity alignment (EA) is the task of identifying the entities that refer to the same real-world object but are located in different knowledge graphs (KGs). For entities to be aligned, existing EA solutions treat them separately and generate alignment \ldots{}", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yao:2021:RRL, author = "Jing Yao and Zhicheng Dou and Jun Xu and Ji-Rong Wen", title = "{RLPS}: a Reinforcement Learning-Based Framework for Personalized Search", journal = j-TOIS, volume = "39", number = "3", pages = "27:1--27:29", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3446617", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3446617", abstract = "Personalized search is a promising way to improve search qualities by taking user interests into consideration. Recently, machine learning and deep learning techniques have been successfully applied to search result personalization. Most existing models \ldots{}", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2021:DPR, author = "Jingyuan Wang and Xin Lin and Yuan Zuo and Junjie Wu", title = "{DGeye}: Probabilistic Risk Perception and Prediction for Urban Dangerous Goods Management", journal = j-TOIS, volume = "39", number = "3", pages = "28:1--28:30", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3448256", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3448256", abstract = "Recent years have witnessed the emergence of worldwide megalopolises and the accompanying public safety events, making urban safety a top priority in modern urban management. Among various threats, dangerous goods such as gas and hazardous chemicals \ldots{}", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Aliannejadi:2021:CAT, author = "Mohammad Aliannejadi and Hamed Zamani and Fabio Crestani and W. Bruce Croft", title = "Context-aware Target Apps Selection and Recommendation for Enhancing Personal Mobile Assistants", journal = j-TOIS, volume = "39", number = "3", pages = "29:1--29:30", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3447678", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3447678", abstract = "Users install many apps on their smartphones, raising issues related to information overload for users and resource management for devices. Moreover, the recent increase in the use of personal assistants has made mobile devices even more pervasive in \ldots{}", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2021:HFS, author = "Jia Chen and Jiaxin Mao and Yiqun Liu and Ziyi Ye and Weizhi Ma and Chao Wang and Min Zhang and Shaoping Ma", title = "A Hybrid Framework for Session Context Modeling", journal = j-TOIS, volume = "39", number = "3", pages = "30:1--30:35", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3448127", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3448127", abstract = "Understanding user intent is essential for various retrieval tasks. By leveraging contextual information within sessions, e.g., query history and user click behaviors, search systems can capture user intent more accurately and thus perform better. However,. \ldots{}", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Vuong:2021:SCC, author = "Tung Vuong and Salvatore Andolina and Giulio Jacucci and Tuukka Ruotsalo", title = "Spoken Conversational Context Improves Query Auto-completion in {Web} Search", journal = j-TOIS, volume = "39", number = "3", pages = "31:1--31:32", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3447875", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3447875", abstract = "Web searches often originate from conversations in which people engage before they perform a search. Therefore, conversations can be a valuable source of context with which to support the search process. We investigate whether spoken input from \ldots{}", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2021:HHG, author = "Tianchi Yang and Linmei Hu and Chuan Shi and Houye Ji and Xiaoli Li and Liqiang Nie", title = "{HGAT}: Heterogeneous Graph Attention Networks for Semi-supervised Short Text Classification", journal = j-TOIS, volume = "39", number = "3", pages = "32:1--32:29", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3450352", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3450352", abstract = "Short text classification has been widely explored in news tagging to provide more efficient search strategies and more effective search results for information retrieval. However, most existing studies, concentrating on long text classification, deliver \ldots{}", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Clarke:2021:ATP, author = "Charles L. A. Clarke and Alexandra Vtyurina and Mark D. Smucker", title = "Assessing Top-$k$ Preferences", journal = j-TOIS, volume = "39", number = "3", pages = "33:1--33:21", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3451161", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3451161", abstract = "Assessors make preference judgments faster and more consistently than graded judgments. Preference judgments can also recognize distinctions between items that appear equivalent under graded judgments. Unfortunately, preference judgments can require more \ldots{}", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2021:CEC, author = "Jiawei Chen and Chengquan Jiang and Can Wang and Sheng Zhou and Yan Feng and Chun Chen and Martin Ester and Xiangnan He", title = "{CoSam}: an Efficient Collaborative Adaptive Sampler for Recommendation", journal = j-TOIS, volume = "39", number = "3", pages = "34:1--34:24", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3450289", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3450289", abstract = "Sampling strategies have been widely applied in many recommendation systems to accelerate model learning from implicit feedback data. A typical strategy is to draw negative instances with uniform distribution, which, however, will severely affect a model'. \ldots{}", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2021:ICR, author = "Chuxu Zhang and Huaxiu Yao and Lu Yu and Chao Huang and Dongjin Song and Haifeng Chen and Meng Jiang and Nitesh V. Chawla", title = "Inductive Contextual Relation Learning for Personalization", journal = j-TOIS, volume = "39", number = "3", pages = "35:1--35:22", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3450353", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3450353", abstract = "Web personalization, e.g., recommendation or relevance search, tailoring a service/product to accommodate specific online users, is becoming increasingly important. Inductive personalization aims to infer the relations between existing entities and unseen \ldots{}", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mena-Maldonado:2021:PBF, author = "Elisa Mena-Maldonado and Roc{\'\i}o Ca{\~n}amares and Pablo Castells and Yongli Ren and Mark Sanderson", title = "Popularity Bias in False-positive Metrics for Recommender Systems Evaluation", journal = j-TOIS, volume = "39", number = "3", pages = "36:1--36:43", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3452740", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3452740", abstract = "We investigate the impact of popularity bias in false-positive metrics in the offline evaluation of recommender systems. Unlike their true-positive complements, false-positive metrics reward systems that minimize recommendations disliked by users. Our \ldots{}", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2021:ERT, author = "Qi Zhang and Hengshu Zhu and Qi Liu and Enhong Chen and Hui Xiong", title = "Exploiting Real-time Search Engine Queries for Earthquake Detection: a Summary of Results", journal = j-TOIS, volume = "39", number = "3", pages = "37:1--37:32", month = jul, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3453842", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Aug 10 13:18:19 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3453842", abstract = "Online search engine has been widely regarded as the most convenient approach for information acquisition. Indeed, the intensive information-seeking behaviors of search engine users make it possible to exploit search engine queries as effective ``crowd \ldots{}''", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hauff:2021:CSR, author = "Claudia Hauff and Julia Kiseleva and Mark Sanderson and Hamed Zamani and Yongfeng Zhang", title = "Conversational Search and Recommendation: Introduction to the Special Issue", journal = j-TOIS, volume = "39", number = "4", pages = "38:1--38:6", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3465272", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3465272", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Thomas:2021:TCC, author = "Paul Thomas and Mary Czerwinksi and Daniel Mcduff and Nick Craswell", title = "Theories of Conversation for Conversational {IR}", journal = j-TOIS, volume = "39", number = "4", pages = "39:1--39:23", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3439869", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3439869", abstract = "Conversational information retrieval is a relatively new and fast-developing research area, but conversation itself has been well studied for decades. Researchers have analysed linguistic phenomena such as structure and semantics but also paralinguistic \ldots{}", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2021:SUA, author = "Shijun Li and Wenqiang Lei and Qingyun Wu and Xiangnan He and Peng Jiang and Tat-Seng Chua", title = "Seamlessly Unifying Attributes and Items: Conversational Recommendation for Cold-start Users", journal = j-TOIS, volume = "39", number = "4", pages = "40:1--40:29", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3446427", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3446427", abstract = "Static recommendation methods like collaborative filtering suffer from the inherent limitation of performing real-time personalization for cold-start users. Online recommendation, e.g., multi-armed bandit approach, addresses this limitation by \ldots{}", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Contreras:2021:ICL, author = "David Contreras and Maria Salam{\'o} and Ludovico Boratto", title = "Integrating Collaboration and Leadership in Conversational Group Recommender Systems", journal = j-TOIS, volume = "39", number = "4", pages = "41:1--41:32", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3462759", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3462759", abstract = "Recent observational studies highlight the importance of considering the interactions between users in the group recommendation process, but to date their integration has been marginal. In this article, we propose a collaborative model based on the social \ldots{}", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wilkinson:2021:WWE, author = "Daricia Wilkinson and {\"O}znur Alkan and Q. Vera Liao and Massimiliano Mattetti and Inge Vejsbjerg and Bart P. Knijnenburg and Elizabeth Daly", title = "Why or Why Not? {The} Effect of Justification Styles on Chatbot Recommendations", journal = j-TOIS, volume = "39", number = "4", pages = "42:1--42:21", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3441715", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3441715", abstract = "Chatbots or conversational recommenders have gained increasing popularity as a new paradigm for Recommender Systems (RS). Prior work on RS showed that providing explanations can improve transparency and trust, which are critical for the adoption of RS. \ldots{}", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wei:2021:TGE, author = "Wei Wei and Jiayi Liu and Xianling Mao and Guibing Guo and Feida Zhu and Pan Zhou and Yuchong Hu and Shanshan Feng", title = "Target-guided Emotion-aware Chat Machine", journal = j-TOIS, volume = "39", number = "4", pages = "43:1--43:24", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3456414", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3456414", abstract = "The consistency of a response to a given post at the semantic level and emotional level is essential for a dialogue system to deliver humanlike interactions. However, this challenge is not well addressed in the literature, since most of the approaches \ldots{}", acknowledgement = ack-nhfb, articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2021:RRM, author = "Ruijian Xu and Chongyang Tao and Jiazhan Feng and Wei Wu and Rui Yan and Dongyan Zhao", title = "Response Ranking with Multi-types of Deep Interactive Representations in Retrieval-based Dialogues", journal = j-TOIS, volume = "39", number = "4", pages = "44:1--44:28", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3462207", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3462207", abstract = "Building an intelligent dialogue system with the ability to select a proper response according to a multi-turn context is challenging in three aspects: (1) the meaning of a context-response pair is built upon language units from multiple granularities \ldots{}", acknowledgement = ack-nhfb, articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2021:DHM, author = "Juntao Li and Chang Liu and Chongyang Tao and Zhangming Chan and Dongyan Zhao and Min Zhang and Rui Yan", title = "Dialogue History Matters! {Personalized} Response Selection in Multi-Turn Retrieval-Based Chatbots", journal = j-TOIS, volume = "39", number = "4", pages = "45:1--45:25", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3453183", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3453183", abstract = "Existing multi-turn context-response matching methods mainly concentrate on obtaining multi-level and multi-dimension representations and better interactions between context utterances and response. However, in real-place conversation scenarios, whether a \ldots{}", acknowledgement = ack-nhfb, articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Musto:2021:MDA, author = "Cataldo Musto and Fedelucio Narducci and Marco Polignano and Marco {De Gemmis} and Pasquale Lops and Giovanni Semeraro", title = "{MyrrorBot}: a Digital Assistant Based on Holistic User Models for Personalized Access to Online Services", journal = j-TOIS, volume = "39", number = "4", pages = "46:1--46:34", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3447679", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3447679", abstract = "In this article, we present MyrrorBot, a personal digital assistant implementing a natural language interface that allows the users to: (i) access online services, such as music, video, news, and food recommendation s, in a personalized way, by exploiting a \ldots{}", acknowledgement = ack-nhfb, articleno = "46", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ren:2021:CSE, author = "Pengjie Ren and Zhumin Chen and Zhaochun Ren and Evangelos Kanoulas and Christof Monz and Maarten {De Rijke}", title = "Conversations with Search Engines: {SERP-based} Conversational Response Generation", journal = j-TOIS, volume = "39", number = "4", pages = "47:1--47:29", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3432726", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3432726", abstract = "In this article, we address the problem of answering complex information needs by conducting conversations with search engines, in the sense that users can express their queries in natural language and directly receive the information they need from a \ldots{}", acknowledgement = ack-nhfb, articleno = "47", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2021:MSC, author = "Sheng-Chieh Lin and Jheng-Hong Yang and Rodrigo Nogueira and Ming-Feng Tsai and Chuan-Ju Wang and Jimmy Lin", title = "Multi-Stage Conversational Passage Retrieval: an Approach to Fusing Term Importance Estimation and Neural Query Rewriting", journal = j-TOIS, volume = "39", number = "4", pages = "48:1--48:29", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3446426", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3446426", abstract = "Conversational search plays a vital role in conversational information seeking. As queries in information seeking dialogues are ambiguous for traditional ad hoc information retrieval (IR) systems due to the coreference and omission resolution problems \ldots{}", acknowledgement = ack-nhfb, articleno = "48", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Vakulenko:2021:LSA, author = "Svitlana Vakulenko and Evangelos Kanoulas and Maarten {De Rijke}", title = "A Large-scale Analysis of Mixed Initiative in Information-Seeking Dialogues for Conversational Search", journal = j-TOIS, volume = "39", number = "4", pages = "49:1--49:32", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3466796", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3466796", abstract = "Conversational search is a relatively young area of research that aims at automating an information-seeking dialogue. In this article, we help to position it with respect to other research areas within conversational artificial intelligence (AI) by \ldots{}", acknowledgement = ack-nhfb, articleno = "49", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Kiesel:2021:MIC, author = "Johannes Kiesel and Lars Meyer and Martin Potthast and Benno Stein", title = "Meta-Information in Conversational Search", journal = j-TOIS, volume = "39", number = "4", pages = "50:1--50:44", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3468868", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3468868", abstract = "The exchange of meta-information has always formed part of information behavior. In this article, we show that this rule also extends to conversational search. Information about the user's information need, their preferences, and the quality of search \ldots{}", acknowledgement = ack-nhfb, articleno = "50", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lipani:2021:HDE, author = "Aldo Lipani and Ben Carterette and Emine Yilmaz", title = "How Am {I} Doing?: Evaluating Conversational Search Systems Offline", journal = j-TOIS, volume = "39", number = "4", pages = "51:1--51:22", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3451160", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3451160", abstract = "As conversational agents like Siri and Alexa gain in popularity and use, conversation is becoming a more and more important mode of interaction for search. Conversational search shares some features with traditional search, but differs in some important \ldots{}", acknowledgement = ack-nhfb, articleno = "51", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2021:MEC, author = "Zeyang Liu and Ke Zhou and Max L. Wilson", title = "Meta-evaluation of Conversational Search Evaluation Metrics", journal = j-TOIS, volume = "39", number = "4", pages = "52:1--52:42", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3445029", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3445029", abstract = "Conversational search systems, such as Google assistant and Microsoft Cortana, enable users to interact with search systems in multiple rounds through natural language dialogues. Evaluating such systems is very challenging, given that any natural language \ldots{}", acknowledgement = ack-nhfb, articleno = "52", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Corno:2021:UII, author = "Fulvio Corno and Luigi {De Russis} and Alberto Monge Roffarello", title = "From Users' Intentions to {IF--THEN} Rules in the {Internet of Things}", journal = j-TOIS, volume = "39", number = "4", pages = "53:1--53:33", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3447264", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3447264", abstract = "In the Internet of Things era, users are willing to personalize the joint behavior of their connected entities, i.e., smart devices and online service, by means of trigger-action rules such as ``IF the entrance Nest security camera detects a movement, THEN \ldots{}''", acknowledgement = ack-nhfb, articleno = "53", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yan:2021:MRA, author = "Rui Yan and Weiheng Liao and Dongyan Zhao and Ji-Rong Wen", title = "Multi-Response Awareness for Retrieval-Based Conversations: Respond with Diversity via Dynamic Representation Learning", journal = j-TOIS, volume = "39", number = "4", pages = "54:1--54:29", month = oct, year = "2021", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3470450", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 23 06:30:06 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3470450", abstract = "Conversational systems now attract great attention due to their promising potential and commercial values. To build a conversational system with moderate intelligence is challenging and requires big (conversational) data, as well as interdisciplinary \ldots{}", acknowledgement = ack-nhfb, articleno = "54", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Patil:2022:GTA, author = "Shubham Patil and Debopriyo Banerjee and Shamik Sural", title = "A Graph Theoretic Approach for Multi-Objective Budget Constrained Capsule Wardrobe Recommendation", journal = j-TOIS, volume = "40", number = "1", pages = "1:1--1:33", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3457182", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3457182", abstract = "Traditionally, capsule wardrobes are manually designed by expert fashionistas through their creativity and technical prowess. The goal is to curate minimal fashion items that can be assembled into several compatible and versatile outfits. It is usually a \ldots{}", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2022:CKA, author = "Yang Deng and Yuexiang Xie and Yaliang Li and Min Yang and Wai Lam and Ying Shen", title = "Contextualized Knowledge-aware Attentive Neural Network: Enhancing Answer Selection with Knowledge", journal = j-TOIS, volume = "40", number = "1", pages = "2:1--2:33", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3457533", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3457533", abstract = "Answer selection, which is involved in many natural language processing applications, such as dialog systems and question answering (QA), is an important yet challenging task in practice, since conventional methods typically suffer from the issues of \ldots{}", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2022:HHE, author = "Lei Guo and Hongzhi Yin and Tong Chen and Xiangliang Zhang and Kai Zheng", title = "Hierarchical Hyperedge Embedding-Based Representation Learning for Group Recommendation", journal = j-TOIS, volume = "40", number = "1", pages = "3:1--3:27", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3457949", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3457949", abstract = "Group recommendation aims to recommend items to a group of users. In this work, we study group recommendation in a particular scenario, namely occasional group recommendation, where groups are formed ad hoc and users may just constitute a group for the \ldots{}", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jadidinejad:2022:SPO, author = "Amir H. Jadidinejad and Craig Macdonald and Iadh Ounis", title = "The {Simpson's Paradox} in the Offline Evaluation of Recommendation Systems", journal = j-TOIS, volume = "40", number = "1", pages = "4:1--4:22", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3458509", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3458509", abstract = "Recommendation systems are often evaluated based on user's interactions that were collected from an existing, already deployed recommendation system. In this situation, users only provide feedback on the exposed items and they may not leave feedback on \ldots{}", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bahrainian:2022:CCA, author = "Seyed Ali Bahrainian and George Zerveas and Fabio Crestani and Carsten Eickhoff", title = "{CATS}: Customizable Abstractive Topic-based Summarization", journal = j-TOIS, volume = "40", number = "1", pages = "5:1--5:24", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464299", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464299", abstract = "Neural sequence-to-sequence models are the state-of-the-art approach used in abstractive summarization of textual documents, useful for producing condensed versions of source text narratives without being restricted to using only words from the original \ldots{}", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mu:2022:KGD, author = "Shanlei Mu and Yaliang Li and Wayne Xin Zhao and Siqing Li and Ji-Rong Wen", title = "Knowledge-Guided Disentangled Representation Learning for Recommender Systems", journal = j-TOIS, volume = "40", number = "1", pages = "6:1--6:26", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464304", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464304", abstract = "In recommender systems, it is essential to understand the underlying factors that affect user-item interaction. Recently, several studies have utilized disentangled representation learning to discover such hidden factors from user-item interaction data, \ldots{}", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zang:2022:CCH, author = "Hongyu Zang and Dongcheng Han and Xin Li and Zhifeng Wan and Mingzhong Wang", title = "{CHA}: Categorical Hierarchy-based Attention for Next {POI} Recommendation", journal = j-TOIS, volume = "40", number = "1", pages = "7:1--7:22", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464300", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464300", abstract = "Next Point-of-interest (POI) recommendation is a key task in improving location-related customer experiences and business operations, but yet remains challenging due to the substantial diversity of human activities and the sparsity of the check-in records \ldots{}", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tian:2022:WHL, author = "Yuan Tian and Ke Zhou and Dan Pelleg", title = "What and How long: Prediction of Mobile App Engagement", journal = j-TOIS, volume = "40", number = "1", pages = "8:1--8:38", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464301", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464301", abstract = "User engagement is crucial to the long-term success of a mobile app. Several metrics, such as dwell time, have been used for measuring user engagement. However, how to effectively predict user engagement in the context of mobile apps is still an open \ldots{}", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2022:UTE, author = "Longxuan Ma and Mingda Li and Wei-Nan Zhang and Jiapeng Li and Ting Liu", title = "Unstructured Text Enhanced Open-Domain Dialogue System: a Systematic Survey", journal = j-TOIS, volume = "40", number = "1", pages = "9:1--9:44", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464377", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464377", abstract = "Incorporating external knowledge into dialogue generation has been proven to benefit the performance of an open-domain Dialogue System (DS), such as generating informative or stylized responses, controlling conversation topics. In this article, we study \ldots{}", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xia:2022:CRA, author = "Lianghao Xia and Chao Huang and Yong Xu and Huance Xu and Xiang Li and Weiguo Zhang", title = "Collaborative Reflection-Augmented Autoencoder Network for Recommender Systems", journal = j-TOIS, volume = "40", number = "1", pages = "10:1--10:22", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3467023", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3467023", abstract = "As the deep learning techniques have expanded to real-world recommendation tasks, many deep neural network based Collaborative Filtering (CF) models have been developed to project user-item interactions into latent feature space, based on various neural \ldots{}", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2022:IAA, author = "Siqing Li and Yaliang Li and Wayne Xin Zhao and Bolin Ding and Ji-Rong Wen", title = "Interpretable Aspect-Aware Capsule Network for Peer Review Based Citation Count Prediction", journal = j-TOIS, volume = "40", number = "1", pages = "11:1--11:29", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3466640", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3466640", abstract = "Citation count prediction is an important task for estimating the future impact of research papers. Most of the existing works utilize the information extracted from the paper itself. In this article, we focus on how to utilize another kind of useful data \ldots{}", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:QTG, author = "Xiao Zhang and Meng Liu and Jianhua Yin and Zhaochun Ren and Liqiang Nie", title = "Question Tagging via Graph-guided Ranking", journal = j-TOIS, volume = "40", number = "1", pages = "12:1--12:23", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3468270", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3468270", abstract = "With the increasing prevalence of portable devices and the popularity of community Question Answering (cQA) sites, users can seamlessly post and answer many questions. To effectively organize the information for precise recommendation and easy searching, \ldots{}", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mackenzie:2022:ARD, author = "Joel Mackenzie and Matthias Petri and Alistair Moffat", title = "Anytime Ranking on Document-Ordered Indexes", journal = j-TOIS, volume = "40", number = "1", pages = "13:1--13:32", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3467890", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3467890", abstract = "Inverted indexes continue to be a mainstay of text search engines, allowing efficient querying of large document collections. While there are a number of possible organizations, document-ordered indexes are the most common, since they are amenable to various query types, support index updates, and allow for efficient dynamic pruning operations. One disadvantage with document-ordered indexes is that high-scoring documents can be distributed across the document identifier space, meaning that index traversal algorithms that terminate early might put search effectiveness at risk. The alternative is impact-ordered indexes, which primarily support top-disjunctions but also allow for anytime query processing, where the search can be terminated at any time, with search quality improving as processing latency increases. Anytime query processing can be used to effectively reduce high-percentile tail latency that is essential for operational scenarios in which a service level agreement (SLA) imposes response time requirements. In this work, we show how document-ordered indexes can be organized such that they can be queried in an anytime fashion, enabling strict latency control with effective early termination. Our experiments show that processing document-ordered topical segments selected by a simple score estimator outperforms existing anytime algorithms, and allows query runtimes to be accurately limited to comply with SLA requirements.", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:RQG, author = "Ruqing Zhang and Jiafeng Guo and Lu Chen and Yixing Fan and Xueqi Cheng", title = "A Review on Question Generation from Natural Language Text", journal = j-TOIS, volume = "40", number = "1", pages = "14:1--14:43", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3468889", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3468889", abstract = "Question generation is an important yet challenging problem in Artificial Intelligence (AI), which aims to generate natural and relevant questions from various input formats, e.g., natural language text, structure database, knowledge base, and image. In \ldots{}", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shen:2022:JRL, author = "Dazhong Shen and Chuan Qin and Hengshu Zhu and Tong Xu and Enhong Chen and Hui Xiong", title = "Joint Representation Learning with Relation-Enhanced Topic Models for Intelligent Job Interview Assessment", journal = j-TOIS, volume = "40", number = "1", pages = "15:1--15:36", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3469654", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3469654", abstract = "The job interview is considered as one of the most essential tasks in talent recruitment, which forms a bridge between candidates and employers in fitting the right person for the right job. While substantial efforts have been made on improving the job \ldots{}", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2022:KPD, author = "Hanrui Wu and Qingyao Wu and Michael K. Ng", title = "Knowledge Preserving and Distribution Alignment for Heterogeneous Domain Adaptation", journal = j-TOIS, volume = "40", number = "1", pages = "16:1--16:29", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3469856", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3469856", abstract = "Domain adaptation aims at improving the performance of learning tasks in a target domain by leveraging the knowledge extracted from a source domain. To this end, one can perform knowledge transfer between these two domains. However, this problem becomes \ldots{}", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shen:2022:UPB, author = "Jiaxing Shen and Jiannong Cao and Oren Lederman and Shaojie Tang and Alex ``Sandy'' Pentland", title = "User Profiling Based on Nonlinguistic Audio Data", journal = j-TOIS, volume = "40", number = "1", pages = "17:1--17:23", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3474826", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3474826", abstract = "User profiling refers to inferring people's attributes of interest (AoIs) like gender and occupation, which enables various applications ranging from personalized services to collective analyses. Massive nonlinguistic audio data brings a novel opportunity \ldots{}", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mustar:2022:STQ, author = "Agn{\`e}s Mustar and Sylvain Lamprier and Benjamin Piwowarski", title = "On the Study of Transformers for Query Suggestion", journal = j-TOIS, volume = "40", number = "1", pages = "18:1--18:27", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3470562", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3470562", abstract = "When conducting a search task, users may find it difficult to articulate their need, even more so when the task is complex. To help them complete their search, search engine usually provide query suggestions. A good query suggestion system requires to \ldots{}", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Culpepper:2022:TDC, author = "J. Shane Culpepper and Guglielmo Faggioli and Nicola Ferro and Oren Kurland", title = "Topic Difficulty: Collection and Query Formulation Effects", journal = j-TOIS, volume = "40", number = "1", pages = "19:1--19:36", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3470563", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3470563", abstract = "Several recent studies have explored the interaction effects between topics, systems, corpora, and components when measuring retrieval effectiveness. However, all of these previous studies assume that a topic or information need is represented by a single \ldots{}", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2022:MID, author = "Wanyu Chen and Pengjie Ren and Fei Cai and Fei Sun and Maarten {De Rijke}", title = "Multi-interest Diversification for End-to-end Sequential Recommendation", journal = j-TOIS, volume = "40", number = "1", pages = "20:1--20:30", month = jan, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3475768", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Jan 5 13:39:59 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3475768", abstract = "Sequential recommenders capture dynamic aspects of users' interests by modeling sequential behavior. Previous studies on sequential recommendations mostly aim to identify users' main recent interests to optimize the recommendation accuracy; they often \ldots{}", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2022:GTU, author = "Xiangnan He and Zhaochun Ren and Emine Yilmaz and Marc Najork and Tat-Seng Chua", title = "Graph Technologies for User Modeling and Recommendation: Introduction to the Special Issue --- {Part 1}", journal = j-TOIS, volume = "40", number = "2", pages = "21:1--21:5", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3477596", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3477596", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gatmiry:2022:NVP, author = "Khashayar Gatmiry and Manuel Gomez-Rodriguez", title = "The Network Visibility Problem", journal = j-TOIS, volume = "40", number = "2", pages = "22:1--22:42", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3460475", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3460475", abstract = "Social media is an attention economy where broadcasters are constantly competing for attention in their followers' feeds. Broadcasters are likely to elicit greater attention from their followers if their posts remain visible at the top of their followers' \ldots{}", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cui:2022:SKA, author = "Yue Cui and Hao Sun and Yan Zhao and Hongzhi Yin and Kai Zheng", title = "Sequential-Knowledge-Aware Next {POI} Recommendation: a Meta-Learning Approach", journal = j-TOIS, volume = "40", number = "2", pages = "23:1--23:22", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3460198", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3460198", abstract = "Accurately recommending the next point of interest (POI) has become a fundamental problem with the rapid growth of location-based social networks. However, sparse, imbalanced check-in data and diverse user check-in patterns pose severe challenges for POI \ldots{}", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2022:HEH, author = "Hao Wang and Defu Lian and Hanghang Tong and Qi Liu and Zhenya Huang and Enhong Chen", title = "{HyperSoRec}: Exploiting Hyperbolic User and Item Representations with Multiple Aspects for Social-aware Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "24:1--24:28", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3463913", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3463913", abstract = "Social recommendation has achieved great success in many domains including e-commerce and location-based social networks. Existing methods usually explore the user-item interactions or user-user connections to predict users' preference behaviors. However, \ldots{}", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dai:2022:BRR, author = "Xinyi Dai and Yunjia Xi and Weinan Zhang and Qing Liu and Ruiming Tang and Xiuqiang He and Jiawei Hou and Jun Wang and Yong Yu", title = "Beyond Relevance Ranking: a General Graph Matching Framework for Utility-Oriented Learning to Rank", journal = j-TOIS, volume = "40", number = "2", pages = "25:1--25:29", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464303", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464303", abstract = "Learning to rank from logged user feedback, such as clicks or purchases, is a central component of many real-world information systems. Different from human-annotated relevance labels, the user feedback is always noisy and biased. Many existing learning \ldots{}", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:LSC, author = "Wei Zhang and Zeyuan Chen and Hongyuan Zha and Jianyong Wang", title = "Learning from Substitutable and Complementary Relations for Graph-based Sequential Product Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "26:1--26:28", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464302", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464302", abstract = "Sequential product recommendation, aiming at predicting the products that a target user will interact with soon, has become a hotspot topic. Most of the sequential recommendation models focus on learning from users' interacted product sequences in a \ldots{}", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tian:2022:EGI, author = "Zhiqiang Tian and Yezheng Liu and Jianshan Sun and Yuanchun Jiang and Mingyue Zhu", title = "Exploiting Group Information for Personalized Recommendation with Graph Neural Networks", journal = j-TOIS, volume = "40", number = "2", pages = "27:1--27:23", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3464764", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3464764", abstract = "Personalized recommendation has become more and more important for users to quickly find relevant items. The key issue of the recommender system is how to model user preferences. Previous work mostly employed user historical data to learn users' \ldots{}", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:MGH, author = "Chengyuan Zhang and Yang Wang and Lei Zhu and Jiayu Song and Hongzhi Yin", title = "Multi-Graph Heterogeneous Interaction Fusion for Social Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "28:1--28:26", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3466641", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3466641", abstract = "With the rapid development of online social recommendation system, substantial methods have been proposed. Unlike traditional recommendation system, social recommendation performs by integrating social relationship features, where there are two major \ldots{}", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhou:2022:DAU, author = "Sheng Zhou and Xin Wang and Martin Ester and Bolang Li and Chen Ye and Zhen Zhang and Can Wang and Jiajun Bu", title = "Direction-Aware User Recommendation Based on Asymmetric Network Embedding", journal = j-TOIS, volume = "40", number = "2", pages = "29:1--29:23", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3466754", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3466754", abstract = "User recommendation aims at recommending users with potential interests in the social network. Previous works have mainly focused on the undirected social networks with symmetric relationship such as friendship, whereas recent advances have been made on \ldots{}", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2022:LLC, author = "Xiaowen Huang and Jitao Sang and Jian Yu and Changsheng Xu", title = "Learning to Learn a Cold-start Sequential Recommender", journal = j-TOIS, volume = "40", number = "2", pages = "30:1--30:25", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3466753", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3466753", abstract = "The cold-start recommendation is an urgent problem in contemporary online applications. It aims to provide users whose behaviors are literally sparse with as accurate recommendations as possible. Many data-driven algorithms, such as the widely used matrix \ldots{}", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2022:BFG, author = "Minghao Zhao and Qilin Deng and Kai Wang and Runze Wu and Jianrong Tao and Changjie Fan and Liang Chen and Peng Cui", title = "Bilateral Filtering Graph Convolutional Network for Multi-relational Social Recommendation in the Power-law Networks", journal = j-TOIS, volume = "40", number = "2", pages = "31:1--31:24", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3469799", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3469799", abstract = "In recent years, advances in Graph Convolutional Networks (GCNs) have given new insights into the development of social recommendation. However, many existing GCN-based social recommendation methods often directly apply GCN to capture user-item and user-. \ldots{}", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mansoury:2022:GBA, author = "Masoud Mansoury and Himan Abdollahpouri and Mykola Pechenizkiy and Bamshad Mobasher and Robin Burke", title = "A Graph-Based Approach for Mitigating Multi-Sided Exposure Bias in Recommender Systems", journal = j-TOIS, volume = "40", number = "2", pages = "32:1--32:31", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3470948", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3470948", abstract = "Fairness is a critical system-level objective in recommender systems that has been the subject of extensive recent research. A specific form of fairness is supplier exposure fairness, where the objective is to ensure equitable coverage of items across all \ldots{}", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2022:LLI, author = "Jun Yang and Weizhi Ma and Min Zhang and Xin Zhou and Yiqun Liu and Shaoping Ma", title = "{LegalGNN}: Legal Information Enhanced Graph Neural Network for Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "33:1--33:29", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3469887", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3469887", abstract = "Recommendation in legal scenario (Legal-Rec) is a specialized recommendation task that aims to provide potential helpful legal documents for users. While there are mainly three differences compared with traditional recommendation: (1) Both the structural \ldots{}", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liang:2022:PUQ, author = "Shangsong Liang and Yupeng Luo and Zaiqiao Meng", title = "Profiling Users for Question Answering Communities via Flow-Based Constrained Co-Embedding Model", journal = j-TOIS, volume = "40", number = "2", pages = "34:1--34:38", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3470565", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3470565", abstract = "In this article, we study the task of user profiling in question answering communities (QACs). Previous user profiling algorithms suffer from a number of defects: they regard users and words as atomic units, leading to the mismatch between them; they are \ldots{}", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qiu:2022:EPI, author = "Ruihong Qiu and Zi Huang and Tong Chen and Hongzhi Yin", title = "Exploiting Positional Information for Session-Based Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "35:1--35:24", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3473339", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3473339", abstract = "For present e-commerce platforms, it is important to accurately predict users' preference for a timely next-item recommendation. To achieve this goal, session-based recommender systems are developed, which are based on a sequence of the most recent user-. \ldots{}", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Pan:2022:PSA, author = "Yaoxin Pan and Shangsong Liang and Jiaxin Ren and Zaiqiao Meng and Qiang Zhang", title = "Personalized, Sequential, Attentive, Metric-Aware Product Search", journal = j-TOIS, volume = "40", number = "2", pages = "36:1--36:29", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3473337", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3473337", abstract = "The task of personalized product search aims at retrieving a ranked list of products given a user's input query and his/her purchase history. To address this task, we propose the PSAM model, a Personalized, Sequential, Attentive and Metric-aware (PSAM) \ldots{}", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2022:SGF, author = "Hui Li and Lianyun Li and Guipeng Xv and Chen Lin and Ke Li and Bingchuan Jiang", title = "{SPEX}: a Generic Framework for Enhancing Neural Social Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "37:1--37:33", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3473338", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3473338", abstract = "Social Recommender Systems (SRS) have attracted considerable attention since its accompanying service, social networks, helps increase user satisfaction and provides auxiliary information to improve recommendations. However, most existing SRS focus on \ldots{}", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2022:LHI, author = "Nengjun Zhu and Jian Cao and Xinjiang Lu and Hui Xiong", title = "Learning a Hierarchical Intent Model for Next-Item Recommendation", journal = j-TOIS, volume = "40", number = "2", pages = "38:1--38:28", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3473972", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3473972", abstract = "A session-based recommender system (SBRS) captures users' evolving behaviors and recommends the next item by profiling users in terms of items in a session. User intent and user preference are two factors affecting his (her) decisions. Specifically, the \ldots{}", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Vuong:2022:DMC, author = "Tung Vuong and Salvatore Andolina and Giulio Jacucci and Tuukka Ruotsalo", title = "Does More Context Help? {Effects} of Context Window and Application Source on Retrieval Performance", journal = j-TOIS, volume = "40", number = "2", pages = "39:1--39:40", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3474055", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3474055", abstract = "We study the effect of contextual information obtained from a user's digital trace on Web search performance. Contextual information is modeled using Dirichlet-Hawkes processes (DHP) and used in augmenting Web search queries. The context is captured by \ldots{}", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Nardini:2022:FFS, author = "Franco Maria Nardini and Roberto Trani and Rossano Venturini", title = "Fast Filtering of Search Results Sorted by Attribute", journal = j-TOIS, volume = "40", number = "2", pages = "40:1--40:24", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3477982", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3477982", abstract = "Modern search services often provide multiple options to rank the search results, e.g., sort ``by relevance'', ``by price'' or ``by discount'' in e-commerce. While the traditional rank by relevance effectively places the relevant results in the top positions of \ldots{}", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2022:EMM, author = "Lei Zhu and Chaoqun Zheng and Xu Lu and Zhiyong Cheng and Liqiang Nie and Huaxiang Zhang", title = "Efficient Multi-modal Hashing with Online Query Adaption for Multimedia Retrieval", journal = j-TOIS, volume = "40", number = "2", pages = "41:1--41:36", month = apr, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3477180", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Feb 2 08:14:20 MST 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/hash.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3477180", abstract = "Multi-modal hashing supports efficient multimedia retrieval well. However, existing methods still suffer from two problems: (1) Fixed multi-modal fusion. They collaborate the multi-modal features with fixed weights for hash learning, which cannot \ldots{}", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2022:ISS, author = "Xiangnan He and Zhaochun Ren and Emine Yilmaz and Marc Najork and Tat-Seng Chua", title = "Introduction to the Special Section on Graph Technologies for User Modeling and Recommendation, {Part 2}", journal = j-TOIS, volume = "40", number = "3", pages = "42:1--42:5", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490180", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490180", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yao:2022:CAK, author = "Jing Yao and Zhicheng Dou and Ji-Rong Wen", title = "Clarifying Ambiguous Keywords with Personal Word Embeddings for Personalized Search", journal = j-TOIS, volume = "40", number = "3", pages = "43:1--43:29", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3470564", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3470564", abstract = "Personalized search tailors document ranking lists for each individual user based on her interests and query intent to better satisfy the user's information need. Many personalized search models have been proposed. They first build a user interest profile \ldots{}", acknowledgement = ack-nhfb, articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xie:2022:DGG, author = "Zhiwen Xie and Runjie Zhu and Kunsong Zhao and Jin Liu and Guangyou Zhou and Jimmy Xiangji Huang", title = "Dual Gated Graph Attention Networks with Dynamic Iterative Training for Cross-Lingual Entity Alignment", journal = j-TOIS, volume = "40", number = "3", pages = "44:1--44:30", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3471165", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3471165", abstract = "Cross-lingual entity alignment has attracted considerable attention in recent years. Past studies using conventional approaches to match entities share the common problem of missing important structural information beyond entities in the modeling process. \ldots{}", acknowledgement = ack-nhfb, articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jin:2022:GLI, author = "Jiarui Jin and Kounianhua Du and Weinan Zhang and Jiarui Qin and Yuchen Fang and Yong Yu and Zheng Zhang and Alexander J. Smola", title = "{GraphHINGE}: Learning Interaction Models of Structured Neighborhood on Heterogeneous Information Network", journal = j-TOIS, volume = "40", number = "3", pages = "45:1--45:35", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3472956", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3472956", abstract = "Heterogeneous information network (HIN) has been widely used to characterize entities of various types and their complex relations. Recent attempts either rely on explicit path reachability to leverage path-based semantic relatedness or graph neighborhood \ldots{}", acknowledgement = ack-nhfb, articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2022:DSR, author = "Lili Wang and Chenghan Huang and Ying Lu and Weicheng Ma and Ruibo Liu and Soroush Vosoughi", title = "Dynamic Structural Role Node Embedding for User Modeling in Evolving Networks", journal = j-TOIS, volume = "40", number = "3", pages = "46:1--46:21", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3472955", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3472955", abstract = "Complex user behavior, especially in settings such as social media, can be organized as time-evolving networks. Through network embedding, we can extract general-purpose vector representations of these dynamic networks which allow us to analyze them \ldots{}", acknowledgement = ack-nhfb, articleno = "46", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:ECF, author = "Ge Zhang and Zhao Li and Jiaming Huang and Jia Wu and Chuan Zhou and Jian Yang and Jianliang Gao", title = "{eFraudCom}: an E-commerce Fraud Detection System via Competitive Graph Neural Networks", journal = j-TOIS, volume = "40", number = "3", pages = "47:1--47:29", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3474379", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3474379", abstract = "With the development of e-commerce, fraud behaviors have been becoming one of the biggest threats to the e-commerce business. Fraud behaviors seriously damage the ranking system of e-commerce platforms and adversely influence the shopping experience of \ldots{}", acknowledgement = ack-nhfb, articleno = "47", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xie:2022:GNC, author = "Qianqian Xie and Yutao Zhu and Jimin Huang and Pan Du and Jian-Yun Nie", title = "Graph Neural Collaborative Topic Model for Citation Recommendation", journal = j-TOIS, volume = "40", number = "3", pages = "48:1--48:30", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3473973", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3473973", abstract = "Due to the overload of published scientific articles, citation recommendation has long been a critical research problem for automatically recommending the most relevant citations of given articles. Relational topic models (RTMs) have shown promise on \ldots{}", acknowledgement = ack-nhfb, articleno = "48", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zeng:2022:MGL, author = "Xingshan Zeng and Jing Li and Lingzhi Wang and Kam-Fai Wong", title = "Modeling Global and Local Interactions for Online Conversation Recommendation", journal = j-TOIS, volume = "40", number = "3", pages = "49:1--49:33", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3473970", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3473970", abstract = "The popularity of social media platforms results in a huge volume of online conversations produced every day. To help users better engage in online conversations, this article presents a novel framework to automatically recommend conversations to users \ldots{}", acknowledgement = ack-nhfb, articleno = "49", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2022:BHD, author = "Yadong Zhu and Xiliang Wang and Qing Li and Tianjun Yao and Shangsong Liang", title = "{BotSpot++}: a Hierarchical Deep Ensemble Model for Bots Install Fraud Detection in Mobile Advertising", journal = j-TOIS, volume = "40", number = "3", pages = "50:1--50:28", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3476107", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3476107", abstract = "Mobile advertising has undoubtedly become one of the fastest-growing industries in the world. The influx of capital attracts increasing fraudsters to defraud money from advertisers. Fraudsters can leverage many techniques, where bots install fraud is the \ldots{}", acknowledgement = ack-nhfb, articleno = "50", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2022:TIL, author = "Jiashu Zhao and Jimmy Xiangji Huang and Hongbo Deng and Yi Chang and Long Xia", title = "Are Topics Interesting or Not? {An} {LDA}-based Topic-graph Probabilistic Model for {Web} Search Personalization", journal = j-TOIS, volume = "40", number = "3", pages = "51:1--51:24", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3476106", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3476106", abstract = "In this article, we propose a Latent Dirichlet Allocation- (LDA) based topic-graph probabilistic personalization model for Web search. This model represents a user graph in a latent topic graph and simultaneously estimates the probabilities that the user \ldots{}", acknowledgement = ack-nhfb, articleno = "51", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2022:SCA, author = "Dan Li and Tong Xu and Peilun Zhou and Weidong He and Yanbin Hao and Yi Zheng and Enhong Chen", title = "Social Context-aware Person Search in Videos via Multi-modal Cues", journal = j-TOIS, volume = "40", number = "3", pages = "52:1--52:25", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3480967", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3480967", abstract = "Person search has long been treated as a crucial and challenging task to support deeper insight in personalized summarization and personality discovery. Traditional methods, e.g., person re-identification and face recognition techniques, which profile \ldots{}", acknowledgement = ack-nhfb, articleno = "52", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sen:2022:KWY, author = "Procheta Sen and Debasis Ganguly and Gareth J. F. Jones", title = "{I} Know What You Need: Investigating Document Retrieval Effectiveness with Partial Session Contexts", journal = j-TOIS, volume = "40", number = "3", pages = "53:1--53:30", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3488667", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3488667", abstract = "Reducing user effort in finding relevant information is one of the key objectives of search systems. Existing approaches have been shown to effectively exploit the context from the current search session of users for automatically suggesting queries to \ldots{}", acknowledgement = ack-nhfb, articleno = "53", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yan:2022:LTL, author = "Surong Yan and Kwei-Jay Lin and Xiaolin Zheng and Haosen Wang", title = "{LkeRec}: Toward Lightweight End-to-End Joint Representation Learning for Building Accurate and Effective Recommendation", journal = j-TOIS, volume = "40", number = "3", pages = "54:1--54:28", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3486673", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3486673", abstract = "Explicit and implicit knowledge about users and items have been used to describe complex and heterogeneous side information for recommender systems (RSs). Many existing methods use knowledge graph embedding (KGE) to learn the representation of a user-item \ldots{}", acknowledgement = ack-nhfb, articleno = "54", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bhoi:2022:PMR, author = "Suman Bhoi and Mong Li Lee and Wynne Hsu and Hao Sen Andrew Fang and Ngiap Chuan Tan", title = "Personalizing Medication Recommendation with a Graph-Based Approach", journal = j-TOIS, volume = "40", number = "3", pages = "55:1--55:23", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3488668", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3488668", abstract = "The broad adoption of electronic health records (EHRs) has led to vast amounts of data being accumulated on a patient's history, diagnosis, prescriptions, and lab tests. Advances in recommender technologies have the potential to utilize this information \ldots{}", acknowledgement = ack-nhfb, articleno = "55", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Paik:2022:TMP, author = "Jiaul H. Paik and Yash Agrawal and Sahil Rishi and Vaishal Shah", title = "Truncated Models for Probabilistic Weighted Retrieval", journal = j-TOIS, volume = "40", number = "3", pages = "56:1--56:24", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3476837", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3476837", abstract = "Existing probabilistic retrieval models do not restrict the domain of the random variables that they deal with. In this article, we show that the upper bound of the normalized term frequency ( tf ) from the relevant documents is much smaller than the upper \ldots{}", acknowledgement = ack-nhfb, articleno = "56", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2022:EHS, author = "Meng Chen and Lei Zhu and Ronghui Xu and Yang Liu and Xiaohui Yu and Yilong Yin", title = "Embedding Hierarchical Structures for Venue Category Representation", journal = j-TOIS, volume = "40", number = "3", pages = "57:1--57:29", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3478285", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3478285", abstract = "Venue categories used in location-based social networks often exhibit a hierarchical structure, together with the category sequences derived from users' check-ins. The two data modalities provide a wealth of information for us to capture the semantic \ldots{}", acknowledgement = ack-nhfb, articleno = "57", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fang:2022:HVC, author = "Jinyuan Fang and Shangsong Liang and Zaiqiao Meng and Maarten {De Rijke}", title = "Hyperspherical Variational Co-embedding for Attributed Networks", journal = j-TOIS, volume = "40", number = "3", pages = "58:1--58:36", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3478284", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3478284", abstract = "Network-based information has been widely explored and exploited in the information retrieval literature. Attributed networks, consisting of nodes, edges as well as attributes describing properties of nodes, are a basic type of network-based data, and are \ldots{}", acknowledgement = ack-nhfb, articleno = "58", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jayashree:2022:MWP, author = "Srivatsa Ramesh Jayashree and Ga{\"e}l Dias and Judith Jeyafreeda Andrew and Sriparna Saha and Fabrice Maurel and St{\'e}phane Ferrari", title = "Multimodal {Web} Page Segmentation Using Self-organized Multi-objective Clustering", journal = j-TOIS, volume = "40", number = "3", pages = "59:1--59:49", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3480966", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3480966", abstract = "Web page segmentation (WPS) aims to break a web page into different segments with coherent intra- and inter-semantics. By evidencing the morpho-dispositional semantics of a web page, WPS has traditionally been used to demarcate informative from non-. \ldots{}", acknowledgement = ack-nhfb, articleno = "59", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Moshfeghi:2022:GTA, author = "Yashar Moshfeghi and Alvaro Francisco Huertas-Rosero", title = "A Game Theory Approach for Estimating Reliability of Crowdsourced Relevance Assessments", journal = j-TOIS, volume = "40", number = "3", pages = "60:1--60:29", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3480965", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3480965", abstract = "In this article, we propose an approach to improve quality in crowdsourcing (CS) tasks using Task Completion Time (TCT) as a source of information about the reliability of workers in a game-theoretical competitive scenario. Our approach is based on the \ldots{}", acknowledgement = ack-nhfb, articleno = "60", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Albahem:2022:CBA, author = "Ameer Albahem and Damiano Spina and Falk Scholer and Lawrence Cavedon", title = "Component-based Analysis of Dynamic Search Performance", journal = j-TOIS, volume = "40", number = "3", pages = "61:1--61:47", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3483237", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3483237", abstract = "In many search scenarios, such as exploratory, comparative, or survey-oriented search, users interact with dynamic search systems to satisfy multi-aspect information needs. These systems utilize different dynamic approaches that exploit various user \ldots{}", acknowledgement = ack-nhfb, articleno = "61", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dang:2022:CBT, author = "Edward Kai Fung Dang and Robert Wing Pong Luk and James Allan", title = "A Comparison between Term-Independence Retrieval Models for Ad Hoc Retrieval", journal = j-TOIS, volume = "40", number = "3", pages = "62:1--62:37", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3483612", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3483612", abstract = "In Information Retrieval, numerous retrieval models or document ranking functions have been developed in the quest for better retrieval effectiveness. Apart from some formal retrieval models formulated on a theoretical basis, various recent works have \ldots{}", acknowledgement = ack-nhfb, articleno = "62", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2022:UAA, author = "Peijie Sun and Le Wu and Kun Zhang and Yu Su and Meng Wang", title = "An Unsupervised Aspect-Aware Recommendation Model with Explanation Text Generation", journal = j-TOIS, volume = "40", number = "3", pages = "63:1--63:29", month = jul, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3483611", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Apr 1 15:26:39 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3483611", abstract = "Review based recommendation utilizes both users' rating records and the associated reviews for recommendation. Recently, with the rapid demand for explanations of recommendation results, reviews are used to train the encoder-decoder models for explanation \ldots{}", acknowledgement = ack-nhfb, articleno = "63", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fang:2022:SRL, author = "Yang Fang and Xiang Zhao and Peixin Huang and Weidong Xiao and Maarten de Rijke", title = "Scalable Representation Learning for Dynamic Heterogeneous Information Networks via Metagraphs", journal = j-TOIS, volume = "40", number = "4", pages = "64:1--64:27", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3485189", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3485189", abstract = "Content representation is a fundamental task in information retrieval. Representation learning is aimed at capturing features of an information object in a low-dimensional space. Most research on representation learning for heterogeneous information \ldots{}", acknowledgement = ack-nhfb, articleno = "64", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ji:2022:SAL, author = "Weiyu Ji and Xiangwu Meng and Yujie Zhang", title = "{STARec}: Adaptive Learning with Spatiotemporal and Activity Influence for {POI} Recommendation", journal = j-TOIS, volume = "40", number = "4", pages = "65:1--65:40", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3485631", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3485631", abstract = "POI recommendation has become an essential means to help people discover attractive places. Intuitively, activities have an important impact on users' decision-making, because users select POIs to attend corresponding activities. However, many existing \ldots{}", acknowledgement = ack-nhfb, articleno = "65", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2022:SMF, author = "Jiafeng Guo and Yinqiong Cai and Yixing Fan and Fei Sun and Ruqing Zhang and Xueqi Cheng", title = "Semantic Models for the First-Stage Retrieval: a Comprehensive Review", journal = j-TOIS, volume = "40", number = "4", pages = "66:1--66:42", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3486250", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3486250", abstract = "Multi-stage ranking pipelines have been a practical solution in modern search systems, where the first-stage retrieval is to return a subset of candidate documents and latter stages attempt to re-rank those candidates. Unlike re-ranking stages going \ldots{}", acknowledgement = ack-nhfb, articleno = "66", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Pan:2022:GCA, author = "Zhiqiang Pan and Fei Cai and Wanyu Chen and Honghui Chen", title = "Graph Co-Attentive Session-based Recommendation", journal = j-TOIS, volume = "40", number = "4", pages = "67:1--67:31", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3486711", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3486711", abstract = "Session-based recommendation aims to generate recommendations merely based on the ongoing session, which is a challenging task. Previous methods mainly focus on modeling the sequential signals or the transition relations between items in the current \ldots{}", acknowledgement = ack-nhfb, articleno = "67", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:GTP, author = "Chuxu Zhang and Julia Kiseleva and Sujay Kumar Jauhar and Ryen W. White", title = "Grounded Task Prioritization with Context-Aware Sequential Ranking", journal = j-TOIS, volume = "40", number = "4", pages = "68:1--68:28", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3486861", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3486861", abstract = "People rely on task management applications and digital assistants to capture and track their tasks, and help with executing them. The burden of organizing and scheduling time for tasks continues to reside with users of these systems, despite the high \ldots{}", acknowledgement = ack-nhfb, articleno = "68", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Peng:2022:RNS, author = "Hao Peng and Ruitong Zhang and Yingtong Dou and Renyu Yang and Jingyi Zhang and Philip S. Yu", title = "Reinforced Neighborhood Selection Guided Multi-Relational Graph Neural Networks", journal = j-TOIS, volume = "40", number = "4", pages = "69:1--69:46", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490181", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490181", abstract = "Graph Neural Networks (GNNs) have been widely used for the representation learning of various structured graph data, typically through message passing among nodes by aggregating their neighborhood information via different operations. While promising, \ldots{}", acknowledgement = ack-nhfb, articleno = "69", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2022:PEE, author = "Chao Wang and Hengshu Zhu and Peng Wang and Chen Zhu and Xi Zhang and Enhong Chen and Hui Xiong", title = "Personalized and Explainable Employee Training Course Recommendations: a {Bayesian} Variational Approach", journal = j-TOIS, volume = "40", number = "4", pages = "70:1--70:32", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490476", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490476", abstract = "As a major component of strategic talent management, learning and development (L\&D) aims at improving the individual and organization performances through planning tailored training for employees to increase and improve their skills and knowledge. While \ldots{}", acknowledgement = ack-nhfb, articleno = "70", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2022:FFM, author = "Jinze Wang and Yongli Ren and Jie Li and Ke Deng", title = "The Footprint of Factorization Models and Their Applications in Collaborative Filtering", journal = j-TOIS, volume = "40", number = "4", pages = "71:1--71:32", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490475", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490475", abstract = "Factorization models have been successfully applied to the recommendation problems and have significant impact to both academia and industries in the field of Collaborative Filtering (CF). However, the intermediate data generated in factorization models' \ldots{}", acknowledgement = ack-nhfb, articleno = "71", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Pan:2022:CGL, author = "Zhiqiang Pan and Fei Cai and Wanyu Chen and Chonghao Chen and Honghui Chen", title = "Collaborative Graph Learning for Session-based Recommendation", journal = j-TOIS, volume = "40", number = "4", pages = "72:1--72:26", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490479", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490479", abstract = "Session-based recommendation (SBR), which mainly relies on a user's limited interactions with items to generate recommendations, is a widely investigated task. Existing methods often apply RNNs or GNNs to model user's sequential behavior or transition \ldots{}", acknowledgement = ack-nhfb, articleno = "72", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2022:CGC, author = "Hongwei Wang and Jure Leskovec", title = "Combining Graph Convolutional Neural Networks and Label Propagation", journal = j-TOIS, volume = "40", number = "4", pages = "73:1--73:27", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490478", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490478", abstract = "Label Propagation Algorithm (LPA) and Graph Convolutional Neural Networks (GCN) are both message passing algorithms on graphs. Both solve the task of node classification, but LPA propagates node label information across the edges of the graph, while GCN \ldots{}", acknowledgement = ack-nhfb, articleno = "73", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xie:2022:LTI, author = "Zhongwei Xie and Ling Liu and Yanzhao Wu and Luo Zhong and Lin Li", title = "Learning Text-image Joint Embedding for Efficient Cross-modal Retrieval with Deep Feature Engineering", journal = j-TOIS, volume = "40", number = "4", pages = "74:1--74:27", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490519", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490519", abstract = "This article introduces a two-phase deep feature engineering framework for efficient learning of semantics enhanced joint embedding, which clearly separates the deep feature engineering in data preprocessing from training the text-image joint embedding \ldots{}", acknowledgement = ack-nhfb, articleno = "74", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cheng:2022:FLA, author = "Zhiyong Cheng and Fan Liu and Shenghan Mei and Yangyang Guo and Lei Zhu and Liqiang Nie", title = "Feature-Level Attentive {ICF} for Recommendation", journal = j-TOIS, volume = "40", number = "4", pages = "75:1--75:24", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3490477", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3490477", abstract = "Item-based collaborative filtering (ICF) enjoys the advantages of high recommendation accuracy and ease in online penalization and thus is favored by the industrial recommender systems. ICF recommends items to a target user based on their similarities to \ldots{}", acknowledgement = ack-nhfb, articleno = "75", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sakai:2022:RAW, author = "Tetsuya Sakai and Sijie Tao and Zhaohao Zeng", title = "Relevance Assessments for {Web} Search Evaluation: Should We Randomise or Prioritise the Pooled Documents?", journal = j-TOIS, volume = "40", number = "4", pages = "76:1--76:35", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3494833", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3494833", abstract = "In the context of depth-$k$ pooling for constructing web search test collections, we compare two approaches to ordering pooled documents for relevance assessors: The prioritisation strategy (PRI) used widely at NTCIR, and the simple randomisation strategy \ldots{}", acknowledgement = ack-nhfb, articleno = "76", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Urgo:2022:UPT, author = "Kelsey Urgo and Jaime Arguello", title = "Understanding the {``Pathway''} Towards a Searcher's Learning Objective", journal = j-TOIS, volume = "40", number = "4", pages = "77:1--77:42", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3495222", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3495222", abstract = "Search systems are often used to support learning-oriented goals. This trend has given rise to the ``search-as-learning'' movement, which proposes that search systems should be designed to support learning. To this end, an important research question is: \ldots{}", acknowledgement = ack-nhfb, articleno = "77", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yu:2022:SHQ, author = "Weiren Yu and Julie McCann and Chengyuan Zhang and Hakan Ferhatosmanoglu", title = "Scaling High-Quality Pairwise Link-Based Similarity Retrieval on Billion-Edge Graphs", journal = j-TOIS, volume = "40", number = "4", pages = "78:1--78:45", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3495209", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3495209", abstract = "SimRank is an attractive link-based similarity measure used in fertile fields of Web search and sociometry. However, the existing deterministic method by Kusumoto et al. [ 24 ] for retrieving SimRank does not always produce high-quality similarity results, \ldots{}", acknowledgement = ack-nhfb, articleno = "78", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:JPF, author = "Peng Zhang and Baoxi Liu and Tun Lu and Xianghua Ding and Hansu Gu and Ning Gu", title = "Jointly Predicting Future Content in Multiple Social Media Sites Based on Multi-task Learning", journal = j-TOIS, volume = "40", number = "4", pages = "79:1--79:28", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3495530", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3495530", abstract = "User-generated contents (UGC) in social media are the direct expression of users' interests, preferences, and opinions. User behavior prediction based on UGC has increasingly been investigated in recent years. Compared to learning a person's behavioral \ldots{}", acknowledgement = ack-nhfb, articleno = "79", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tang:2022:RCI, author = "Zhiwen Tang and Grace Hui Yang", title = "A Re-classification of Information Seeking Tasks and Their Computational Solutions", journal = j-TOIS, volume = "40", number = "4", pages = "80:1--80:32", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3497875", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3497875", abstract = "This article presents a re-classification of information seeking (IS) tasks, concepts, and algorithms. The proposed taxonomy provides new dimensions to look into information seeking tasks and methods. The new dimensions include number of search iterations,. \ldots{}", acknowledgement = ack-nhfb, articleno = "80", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Frummet:2022:WCC, author = "Alexander Frummet and David Elsweiler and Bernd Ludwig", title = "{``What Can I Cook with these Ingredients?''} --- Understanding Cooking-Related Information Needs in Conversational Search", journal = j-TOIS, volume = "40", number = "4", pages = "81:1--81:32", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3498330", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3498330", abstract = "As conversational search becomes more pervasive, it becomes increasingly important to understand the users' underlying information needs when they converse with such systems in diverse domains. We conduct an in situ study to understand information needs \ldots{}", acknowledgement = ack-nhfb, articleno = "81", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2022:DGR, author = "Yongqi Li and Wenjie Li and Liqiang Nie", title = "Dynamic Graph Reasoning for Conversational Open-Domain Question Answering", journal = j-TOIS, volume = "40", number = "4", pages = "82:1--82:24", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3498557", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3498557", abstract = "In recent years, conversational agents have provided a natural and convenient access to useful information in people's daily life, along with a broad and new research topic, conversational question answering (QA). On the shoulders of conversational QA, we \ldots{}", acknowledgement = ack-nhfb, articleno = "82", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2022:MSE, author = "Rui Li and Cheng Yang and Tingwei Li and Sen Su", title = "{MiDTD}: a Simple and Effective Distillation Framework for Distantly Supervised Relation Extraction", journal = j-TOIS, volume = "40", number = "4", pages = "83:1--83:32", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3503917", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3503917", abstract = "Relation extraction (RE), an important information extraction task, faced the great challenge brought by limited annotation data. To this end, distant supervision was proposed to automatically label RE data, and thus largely increased the number of \ldots{}", acknowledgement = ack-nhfb, articleno = "83", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2022:CVN, author = "Peng Zhang and Wenjie Hui and Benyou Wang and Donghao Zhao and Dawei Song and Christina Lioma and Jakob Grue Simonsen", title = "Complex-valued Neural Network-based Quantum Language Models", journal = j-TOIS, volume = "40", number = "4", pages = "84:1--84:31", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3505138", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3505138", abstract = "Language modeling is essential in Natural Language Processing and Information Retrieval related tasks. After the statistical language models, Quantum Language Model (QLM) has been proposed to unify both single words and compound terms in the same \ldots{}", acknowledgement = ack-nhfb, articleno = "84", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2022:SMR, author = "Zhenduo Wang and Qingyao Ai", title = "Simulating and Modeling the Risk of Conversational Search", journal = j-TOIS, volume = "40", number = "4", pages = "85:1--85:33", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3507357", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3507357", abstract = "In conversational search, agents can interact with users by asking clarifying questions to increase their chance of finding better results. Many recent works and shared tasks in both natural language processing and information retrieval communities have \ldots{}", acknowledgement = ack-nhfb, articleno = "85", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2022:LNG, author = "Yutao Zhu and Ruihua Song and Jian-Yun Nie and Pan Du and Zhicheng Dou and Jin Zhou", title = "Leveraging Narrative to Generate Movie Script", journal = j-TOIS, volume = "40", number = "4", pages = "86:1--86:32", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3507356", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3507356", abstract = "Generating a text based on a predefined guideline is an interesting but challenging problem. A series of studies have been carried out in recent years. In dialogue systems, researchers have explored driving a dialogue based on a plan, while in story \ldots{}", acknowledgement = ack-nhfb, articleno = "86", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2022:TPA, author = "Yang Deng and Yaliang Li and Wenxuan Zhang and Bolin Ding and Wai Lam", title = "Toward Personalized Answer Generation in E-Commerce via Multi-perspective Preference Modeling", journal = j-TOIS, volume = "40", number = "4", pages = "87:1--87:28", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3507782", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3507782", abstract = "Recently, Product Question Answering (PQA) on E-Commerce platforms has attracted increasing attention as it can act as an intelligent online shopping assistant and improve the customer shopping experience. Its key function, automatic answer generation for \ldots{}", acknowledgement = ack-nhfb, articleno = "87", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Rahmani:2022:SAI, author = "Hossein A. Rahmani and Mohammad Aliannejadi and Mitra Baratchi and Fabio Crestani", title = "A Systematic Analysis on the Impact of Contextual Information on Point-of-Interest Recommendation", journal = j-TOIS, volume = "40", number = "4", pages = "88:1--88:35", month = oct, year = "2022", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3508478", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 16 10:23:24 MDT 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3508478", abstract = "As the popularity of Location-based Social Networks increases, designing accurate models for Point-of-Interest (POI) recommendation receives more attention. POI recommendation is often performed by incorporating contextual information into previously \ldots{}", acknowledgement = ack-nhfb, articleno = "88", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lo:2023:CPR, author = "Pei-Chi Lo and Ee-Peng Lim", title = "Contextual Path Retrieval: a Contextual Entity Relation Embedding-based Approach", journal = j-TOIS, volume = "41", number = "1", pages = "1:1--1:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3502720", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3502720", abstract = "Contextual path retrieval (CPR) refers to the task of finding contextual path(s) between a pair of entities in a knowledge graph that explains the connection between them in a given context. For this novel retrieval task, we propose the Embedding-based \ldots{}", acknowledgement = ack-nhfb, articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ling:2023:GRI, author = "Yanxiang Ling and Fei Cai and Jun Liu and Honghui Chen and Maarten de Rijke", title = "Generating Relevant and Informative Questions for Open-Domain Conversations", journal = j-TOIS, volume = "41", number = "1", pages = "2:1--2:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3510612", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3510612", abstract = "Recent research has highlighted the importance of mixed-initiative interactions in conversational search. To enable mixed-initiative interactions, information retrieval systems should be able to ask diverse questions, such as information-seeking, \ldots{}", acknowledgement = ack-nhfb, articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zheng:2023:IAD, author = "Zhi Zheng and Chao Wang and Tong Xu and Dazhong Shen and Penggang Qin and Xiangyu Zhao and Baoxing Huai and Xian Wu and Enhong Chen", title = "Interaction-aware Drug Package Recommendation via Policy Gradient", journal = j-TOIS, volume = "41", number = "1", pages = "3:1--3:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3511020", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3511020", abstract = "Recent years have witnessed the rapid accumulation of massive electronic medical records, which highly support intelligent medical services such as drug recommendation. However, although there are multiple interaction types between drugs, e.g., synergism \ldots{}", acknowledgement = ack-nhfb, articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2023:KGK, author = "Ting Ma and Longtao Huang and Qianqian Lu and Songlin Hu", title = "{KR-GCN}: Knowledge-Aware Reasoning with Graph Convolution Network for Explainable Recommendation", journal = j-TOIS, volume = "41", number = "1", pages = "4:1--4:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3511019", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3511019", abstract = "Incorporating knowledge graphs (KGs) into recommender systems to provide explainable recommendation has attracted much attention recently. The multi-hop paths in KGs can provide auxiliary facts for improving recommendation performance as well as \ldots{}", acknowledgement = ack-nhfb, articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:UBS, author = "Junqi Zhang and Yiqun Liu and Jiaxin Mao and Weizhi Ma and Jiazheng Xu and Shaoping Ma and Qi Tian", title = "User Behavior Simulation for Search Result Re-ranking", journal = j-TOIS, volume = "41", number = "1", pages = "5:1--5:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3511469", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3511469", abstract = "Result ranking is one of the major concerns for Web search technologies. Most existing methodologies rank search results in descending order of relevance. To model the interactions among search results, reinforcement learning (RL algorithms have been \ldots{})", acknowledgement = ack-nhfb, articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2023:PET, author = "Liwei Huang and Yutao Ma and Yanbo Liu and Bohong Danny Du and Shuliang Wang and Deyi Li", title = "Position-Enhanced and Time-aware Graph Convolutional Network for Sequential Recommendations", journal = j-TOIS, volume = "41", number = "1", pages = "6:1--6:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3511700", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3511700", abstract = "The sequential recommendation (also known as the next-item recommendation), which aims to predict the following item to recommend in a session according to users' historical behavior, plays a critical role in improving session-based recommender systems. \ldots{}", acknowledgement = ack-nhfb, articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:HSI, author = "Bing Li and Peng Yang and Hanlin Zhao and Penghui Zhang and Zijian Liu", title = "Hierarchical Sliding Inference Generator for Question-driven Abstractive Answer Summarization", journal = j-TOIS, volume = "41", number = "1", pages = "7:1--7:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3511891", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3511891", abstract = "Text summarization on non-factoid question answering (NQA) aims at identifying the core information of redundant answer guidance using questions, which can dramatically improve answer readability and comprehensibility. Most existing approaches focus on \ldots{}", acknowledgement = ack-nhfb, articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Feng:2023:RRP, author = "Chao Feng and Defu Lian and Xiting Wang and Zheng Liu and Xing Xie and Enhong Chen", title = "Reinforcement Routing on Proximity Graph for Efficient Recommendation", journal = j-TOIS, volume = "41", number = "1", pages = "8:1--8:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3512767", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3512767", abstract = "We focus on Maximum Inner Product Search (MIPS), which is an essential problem in many machine learning communities. Given a query, MIPS finds the most similar items with the maximum inner products. Methods for Nearest Neighbor Search (NNS) which is \ldots{}", acknowledgement = ack-nhfb, articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2023:FTG, author = "Xiuying Chen and Mingzhe Li and Shen Gao and Zhangming Chan and Dongyan Zhao and Xin Gao and Xiangliang Zhang and Rui Yan", title = "Follow the Timeline! {Generating} an Abstractive and Extractive Timeline Summary in Chronological Order", journal = j-TOIS, volume = "41", number = "1", pages = "9:1--9:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3517221", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3517221", abstract = "Today, timestamped web documents related to a general news query flood the Internet, and timeline summarization targets this concisely by summarizing the evolution trajectory of events along the timeline. Unlike traditional document summarization, \ldots{}", acknowledgement = ack-nhfb, articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shang:2023:LRT, author = "Yu-Ming Shang and Heyan Huang and Xin Sun and Wei Wei and Xian-Ling Mao", title = "Learning Relation Ties with a Force-Directed Graph in Distant Supervised Relation Extraction", journal = j-TOIS, volume = "41", number = "1", pages = "10:1--10:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3520082", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3520082", abstract = "Relation ties, defined as the correlation and mutual exclusion between different relations, are critical for distant supervised relation extraction. Previous studies usually obtain this property by greedily learning the local connections between \ldots{}", acknowledgement = ack-nhfb, articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2023:SRM, author = "Chenyang Wang and Weizhi Ma and Chong Chen and Min Zhang and Yiqun Liu and Shaoping Ma", title = "Sequential Recommendation with Multiple Contrast Signals", journal = j-TOIS, volume = "41", number = "1", pages = "11:1--11:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3522673", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3522673", abstract = "Sequential recommendation has become a trending research topic for its capability to capture dynamic user intents based on historical interaction sequence. To train a sequential recommendation model, it is a common practice to optimize the next-item \ldots{}", acknowledgement = ack-nhfb, articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2023:RNS, author = "Chong Chen and Weizhi Ma and Min Zhang and Chenyang Wang and Yiqun Liu and Shaoping Ma", title = "Revisiting Negative Sampling vs. Non-sampling in Implicit Recommendation", journal = j-TOIS, volume = "41", number = "1", pages = "12:1--12:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3522672", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3522672", abstract = "Recommendation systems play an important role in alleviating the information overload issue. Generally, a recommendation model is trained to discern between positive (liked) and negative (disliked) instances for each user. However, under the open-world \ldots{}", acknowledgement = ack-nhfb, articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tian:2023:CPM, author = "Yuan Tian and Ke Zhou and Dan Pelleg", title = "Characterization and Prediction of Mobile Tasks", journal = j-TOIS, volume = "41", number = "1", pages = "13:1--13:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3522711", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3522711", abstract = "Mobile devices have become an increasingly ubiquitous part of our everyday life. We use mobile services to perform a broad range of tasks (e.g., booking travel or conducting remote office work), leading to often lengthy interactions with several distinct \ldots{}", acknowledgement = ack-nhfb, articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2023:TET, author = "Xu Chen and Ya Zhang and Ivor W. Tsang and Yuangang Pan and Jingchao Su", title = "Toward Equivalent Transformation of User Preferences in Cross Domain Recommendation", journal = j-TOIS, volume = "41", number = "1", pages = "14:1--14:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3522762", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3522762", abstract = "Cross domain recommendation (CDR) is one popular research topic in recommender systems. This article focuses on a popular scenario for CDR where different domains share the same set of users but no overlapping items. The majority of recent methods have \ldots{}", acknowledgement = ack-nhfb, articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:SDA, author = "Weinan Zhang and Yiming Cui and Kaiyan Zhang and Yifa Wang and Qingfu Zhu and Lingzhi Li and Ting Liu", title = "A Static and Dynamic Attention Framework for Multi Turn Dialogue Generation", journal = j-TOIS, volume = "41", number = "1", pages = "15:1--15:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3522763", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3522763", abstract = "Recently, research on open domain dialogue systems have attracted extensive interests of academic and industrial researchers. The goal of an open domain dialogue system is to imitate humans in conversations. Previous works on single turn conversation \ldots{}", acknowledgement = ack-nhfb, articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zou:2023:UMC, author = "Jie Zou and Mohammad Aliannejadi and Evangelos Kanoulas and Maria Soledad Pera and Yiqun Liu", title = "Users Meet Clarifying Questions: Toward a Better Understanding of User Interactions for Search Clarification", journal = j-TOIS, volume = "41", number = "1", pages = "16:1--16:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3524110", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3524110", abstract = "The use of clarifying questions (CQs) is a fairly new and useful technique to aid systems in recognizing the intent, context, and preferences behind user queries. Yet, understanding the extent of the effect of CQs on user behavior and the ability to \ldots{}", acknowledgement = ack-nhfb, articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:KEA, author = "Yingying Zhang and Xian Wu and Quan Fang and Shengsheng Qian and Changsheng Xu", title = "Knowledge-Enhanced Attributed Multi-Task Learning for Medicine Recommendation", journal = j-TOIS, volume = "41", number = "1", pages = "17:1--17:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3527662", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3527662", abstract = "Medicine recommendation systems target to recommend a set of medicines given a set of symptoms which play a crucial role in assisting doctors in their daily clinics. Existing approaches are either rule-based or supervised. However, the former heavily \ldots{}", acknowledgement = ack-nhfb, articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Choi:2023:IKR, author = "Bogeum Choi and Jaime Arguello and Robert Capra and Austin R. Ward", title = "The Influences of a Knowledge Representation Tool on Searchers with Varying Cognitive Abilities", journal = j-TOIS, volume = "41", number = "1", pages = "18:1--18:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3527661", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3527661", abstract = "While current systems are effective in helping searchers resolve simple information needs (e.g., fact-finding), they provide less support for searchers working on complex information-seeking tasks. Complex search tasks involve a wide range of (meta). \ldots{}", acknowledgement = ack-nhfb, articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2023:CPT, author = "Hui Wang and Kun Zhou and Xin Zhao and Jingyuan Wang and Ji-Rong Wen", title = "Curriculum Pre-training Heterogeneous Subgraph Transformer for Top-{$N$} Recommendation", journal = j-TOIS, volume = "41", number = "1", pages = "19:1--19:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3528667", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3528667", abstract = "To characterize complex and heterogeneous side information in recommender systems, the heterogeneous information network (HIN) has shown superior performance and attracted much research attention. In HIN, the rich entities, relations, and paths can be \ldots{}", acknowledgement = ack-nhfb, articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wan:2023:MCH, author = "Qizhi Wan and Changxuan Wan and Keli Xiao and Rong Hu and Dexi Liu", title = "A Multi-channel Hierarchical Graph Attention Network for Open Event Extraction", journal = j-TOIS, volume = "41", number = "1", pages = "20:1--20:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3528668", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3528668", abstract = "Event extraction is an essential task in natural language processing. Although extensively studied, existing work shares issues in three aspects, including (1) the limitations of using original syntactic dependency structure, (2) insufficient \ldots{}", acknowledgement = ack-nhfb, articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2023:IRI, author = "Haonan Chen and Zhicheng Dou and Qiannan Zhu and Xiaochen Zuo and Ji-Rong Wen", title = "Integrating Representation and Interaction for Context-Aware Document Ranking", journal = j-TOIS, volume = "41", number = "1", pages = "21:1--21:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3529955", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3529955", abstract = "Recent studies show that historical behaviors (such as queries and their clicks) contained in a search session can benefit the ranking performance of subsequent queries in the session. Existing neural context-aware ranking models usually rank documents \ldots{}", acknowledgement = ack-nhfb, articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liang:2023:FSA, author = "Bin Liang and Xiang Li and Lin Gui and Yonghao Fu and Yulan He and Min Yang and Ruifeng Xu", title = "Few-shot Aspect Category Sentiment Analysis via Meta-learning", journal = j-TOIS, volume = "41", number = "1", pages = "22:1--22:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3529954", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3529954", abstract = "Existing aspect-based/category sentiment analysis methods have shown great success in detecting sentiment polarity toward a given aspect in a sentence with supervised learning, where the training and inference stages share the same pre-defined set of \ldots{}", acknowledgement = ack-nhfb, articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2023:PGS, author = "Shiwei Zhao and Runze Wu and Jianrong Tao and Manhu Qu and Minghao Zhao and Changjie Fan and Hongke Zhao", title = "{perCLTV}: a General System for Personalized Customer Lifetime Value Prediction in Online Games", journal = j-TOIS, volume = "41", number = "1", pages = "23:1--23:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3530012", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3530012", abstract = "Online games make up the largest segment of the booming global game market in terms of revenue as well as players. Unlike games that sell games at one time for profit, online games make money from in-game purchases by a large number of engaged players. \ldots{}", acknowledgement = ack-nhfb, articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2023:PNR, author = "Chuhan Wu and Fangzhao Wu and Yongfeng Huang and Xing Xie", title = "Personalized News Recommendation: Methods and Challenges", journal = j-TOIS, volume = "41", number = "1", pages = "24:1--24:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3530257", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3530257", abstract = "Personalized news recommendation is important for users to find interesting news information and alleviate information overload. Although it has been extensively studied over decades and has achieved notable success in improving user experience, there are \ldots{}", acknowledgement = ack-nhfb, articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gaeta:2023:RQV, author = "Rossano Gaeta and Michele Garetto and Giancarlo Ruffo and Alessandro Flammini", title = "Reconciling the Quality vs Popularity Dichotomy in Online Cultural Markets", journal = j-TOIS, volume = "41", number = "1", pages = "25:1--25:??", month = jan, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3530790", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:16 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3530790", abstract = "We propose a simple model of an idealized online cultural market in which N items, endowed with a hidden quality metric, are recommended to users by a ranking algorithm possibly biased by the current items' popularity. Our goal is to better understand the \ldots{}", acknowledgement = ack-nhfb, articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2023:TAP, author = "Yuyue Zhao and Xiang Wang and Jiawei Chen and Yashen Wang and Wei Tang and Xiangnan He and Haiyong Xie", title = "Time-aware Path Reasoning on Knowledge Graph for Recommendation", journal = j-TOIS, volume = "41", number = "2", pages = "26:1--26:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3531267", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3531267", abstract = "Reasoning on knowledge graph (KG) has been studied for explainable recommendation due to its ability of providing explicit explanations. However, current KG-based explainable recommendation methods unfortunately ignore the temporal information (such as \ldots{})", acknowledgement = ack-nhfb, articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2023:LIE, author = "Kai Sun and Richong Zhang and Samuel Mensah and Yongyi Mao and Xudong Liu", title = "Learning Implicit and Explicit Multi-task Interactions for Information Extraction", journal = j-TOIS, volume = "41", number = "2", pages = "27:1--27:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3533020", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3533020", abstract = "Information extraction aims at extracting entities, relations, and so on, in text to support information retrieval systems. To extract information, researchers have considered multitask learning (ML) approaches. The conventional ML approach learns shared \ldots{}", acknowledgement = ack-nhfb, articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:KBE, author = "Richong Zhang and Jaein Kim and Jiajie Mei and Yongyi Mao", title = "Knowledge Base Embedding for Sampling-Based Prediction", journal = j-TOIS, volume = "41", number = "2", pages = "28:1--28:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3533769", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3533769", abstract = "Each link prediction task requires different degrees of answer diversity. While a link prediction task may expect up to a couple of answers, another may expect nearly a hundred answers. Given this fact, the performance of a link prediction model can be \ldots{}", acknowledgement = ack-nhfb, articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2023:NRM, author = "Chen Wu and Ruqing Zhang and Jiafeng Guo and Yixing Fan and Xueqi Cheng", title = "Are Neural Ranking Models Robust?", journal = j-TOIS, volume = "41", number = "2", pages = "29:1--29:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3534928", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3534928", abstract = "Recently, we have witnessed the bloom of neural ranking models in the information retrieval (IR) field. So far, much effort has been devoted to developing effective neural ranking models that can generalize well on new data. There has been less attention \ldots{}", acknowledgement = ack-nhfb, articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2023:MME, author = "Kang Liu and Feng Xue and Dan Guo and Le Wu and Shujie Li and Richang Hong", title = "{MEGCF}: Multimodal Entity Graph Collaborative Filtering for Personalized Recommendation", journal = j-TOIS, volume = "41", number = "2", pages = "30:1--30:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3544106", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3544106", abstract = "In most E-commerce platforms, whether the displayed items trigger the user's interest largely depends on their most eye-catching multimodal content. Consequently, increasing efforts focus on modeling multimodal user preference, and the pressing paradigm \ldots{}", acknowledgement = ack-nhfb, articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hao:2023:MSB, author = "Bowen Hao and Hongzhi Yin and Jing Zhang and Cuiping Li and Hong Chen", title = "A Multi-strategy-based Pre-training Method for Cold-start Recommendation", journal = j-TOIS, volume = "41", number = "2", pages = "31:1--31:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3544107", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3544107", abstract = "The cold-start issue is a fundamental challenge in Recommender Systems. The recent self-supervised learning (SSL) on Graph Neural Networks (GNNs) model, PT-GNN, pre-trains the GNN model to reconstruct the cold-start embeddings and has shown great \ldots{}", acknowledgement = ack-nhfb, articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2023:RSA, author = "Wayne Xin Zhao and Zihan Lin and Zhichao Feng and Pengfei Wang and Ji-Rong Wen", title = "A Revisiting Study of Appropriate Offline Evaluation for Top-{$N$} Recommendation Algorithms", journal = j-TOIS, volume = "41", number = "2", pages = "32:1--32:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3545796", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3545796", abstract = "In recommender systems, top- N recommendation is an important task with implicit feedback data. Although the recent success of deep learning largely pushes forward the research on top- N recommendation, there are increasing concerns on appropriate \ldots{}", acknowledgement = ack-nhfb, articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2023:AAE, author = "Hanrui Wu and Jinyi Long and Nuosi Li and Dahai Yu and Michael K. Ng", title = "Adversarial Auto-encoder Domain Adaptation for Cold-start Recommendation with Positive and Negative Hypergraphs", journal = j-TOIS, volume = "41", number = "2", pages = "33:1--33:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3544105", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3544105", abstract = "This article presents a novel model named Adversarial Auto-encoder Domain Adaptation to handle the recommendation problem under cold-start settings. Specifically, we divide the hypergraph into two hypergraphs, i.e., a positive hypergraph and a negative \ldots{}", acknowledgement = ack-nhfb, articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2023:GGD, author = "Xubo Qin and Zhicheng Dou and Yutao Zhu and Ji-Rong Wen", title = "{GDESA}: Greedy Diversity Encoder with Self-attention for Search Results Diversification", journal = j-TOIS, volume = "41", number = "2", pages = "34:1--34:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3544103", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3544103", abstract = "Search result diversification aims to generate diversified search results so as to meet the various information needs of users. Most of those existing diversification methods greedily select the optimal documents one-by-one comparing with the selected \ldots{}", acknowledgement = ack-nhfb, articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:PPP, author = "Peng-Fei Zhang and Guangdong Bai and Hongzhi Yin and Zi Huang", title = "Proactive Privacy-preserving Learning for Cross-modal Retrieval", journal = j-TOIS, volume = "41", number = "2", pages = "35:1--35:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3545799", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3545799", abstract = "Deep cross-modal retrieval techniques have recently achieved remarkable performance, which also poses severe threats to data privacy potentially. Nowadays, enormous user-generated contents that convey personal information are released and shared on the \ldots{}", acknowledgement = ack-nhfb, articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Moreo:2023:GFE, author = "Alejandro Moreo and Andrea Pedrotti and Fabrizio Sebastiani", title = "Generalized Funnelling: Ensemble Learning and Heterogeneous Document Embeddings for Cross-Lingual Text Classification", journal = j-TOIS, volume = "41", number = "2", pages = "36:1--36:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3544104", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3544104", abstract = "Funnelling (Fun) is a recently proposed method for cross-lingual text classification (CLTC) based on a two-tier learning ensemble for heterogeneous transfer learning (HTL). In this ensemble method, 1st-tier classifiers, each working on a different and \ldots{}", acknowledgement = ack-nhfb, articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zheng:2023:SAK, author = "Jianming Zheng and Fei Cai and Yanxiang Ling and Honghui Chen", title = "Sequence-aware Knowledge Distillation for a Lightweight Event Representation", journal = j-TOIS, volume = "41", number = "2", pages = "37:1--37:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3545798", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3545798", abstract = "Event representation targets to model the event-reasoning process as a machine-readable format. Previous studies on event representation mostly concentrate on a sole modeling perspective and have not well investigated the scenario-level knowledge, which \ldots{}", acknowledgement = ack-nhfb, articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Datta:2023:RIG, author = "Suchana Datta and Debasis Ganguly and Mandar Mitra and Derek Greene", title = "A Relative Information Gain-based Query Performance Prediction Framework with Generated Query Variants", journal = j-TOIS, volume = "41", number = "2", pages = "38:1--38:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3545112", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3545112", abstract = "Query performance prediction (QPP) methods, which aim to predict the performance of a query, often rely on evidences in the form of different characteristic patterns in the distribution of Retrieval Status Values (RSVs). However, for neural IR models, it \ldots{}", acknowledgement = ack-nhfb, articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:MML, author = "Hang Zhang and Yajun Yang and Xin Wang and Hong Gao and Qinghua Hu", title = "{MLI}: a Multi-level Inference Mechanism for User Attributes in Social Networks", journal = j-TOIS, volume = "41", number = "2", pages = "39:1--39:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3545797", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3545797", abstract = "In the social network, each user has attributes for self-description called user attributes, which are semantically hierarchical. Attribute inference has become an essential way for social platforms to realize user classifications and targeted \ldots{}", acknowledgement = ack-nhfb, articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2023:GFR, author = "Zhaohao Lin and Weike Pan and Qiang Yang and Zhong Ming", title = "A Generic Federated Recommendation Framework via Fake Marks and Secret Sharing", journal = j-TOIS, volume = "41", number = "2", pages = "40:1--40:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3548456", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3548456", abstract = "With the implementation of privacy protection laws such as GDPR, it is increasingly difficult for organizations to legally collect users' data. However, a typical machine learning-based recommendation algorithm requires the data to learn users' \ldots{}", acknowledgement = ack-nhfb, articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cheng:2023:CSH, author = "Lizhi Cheng and Weijia Jia and Wenmian Yang", title = "Capture Salient Historical Information: a Fast and Accurate Non-autoregressive Model for Multi-turn Spoken Language Understanding", journal = j-TOIS, volume = "41", number = "2", pages = "41:1--41:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3545800", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3545800", abstract = "Spoken Language Understanding (SLU), a core component of the task-oriented dialogue system, expects a shorter inference facing the impatience of human users. Existing work increases inference speed by designing non-autoregressive models for single-turn \ldots{}", acknowledgement = ack-nhfb, articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zang:2023:SCD, author = "Tianzi Zang and Yanmin Zhu and Haobing Liu and Ruohan Zhang and Jiadi Yu", title = "A Survey on Cross-domain Recommendation: Taxonomies, Methods, and Future Directions", journal = j-TOIS, volume = "41", number = "2", pages = "42:1--42:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3548455", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3548455", abstract = "Traditional recommendation systems are faced with two long-standing obstacles, namely data sparsity and cold-start problems, which promote the emergence and development of Cross-Domain Recommendation (CDR). The core idea of CDR is to leverage information \ldots{}", acknowledgement = ack-nhfb, articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2023:AGP, author = "Yiqi Wang and Chaozhuo Li and Zheng Liu and Mingzheng Li and Jiliang Tang and Xing Xie and Lei Chen and Philip S. Yu", title = "An Adaptive Graph Pre-training Framework for Localized Collaborative Filtering", journal = j-TOIS, volume = "41", number = "2", pages = "43:1--43:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3555372", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3555372", abstract = "Graph neural networks (GNNs) have been widely applied in the recommendation tasks and have achieved very appealing performance. However, most GNN-based recommendation methods suffer from the problem of data sparsity in practice. Meanwhile, pre-training \ldots{}", acknowledgement = ack-nhfb, articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2023:PGH, author = "Zhenya Huang and Binbin Jin and Hongke Zhao and Qi Liu and Defu Lian and Bao Tengfei and Enhong Chen", title = "Personal or General? {A} Hybrid Strategy with Multi-factors for News Recommendation", journal = j-TOIS, volume = "41", number = "2", pages = "44:1--44:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3555373", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3555373", abstract = "News recommender systems have become an effective manner to help users make decisions by suggesting the potential news that users may click and read, which has shown the proliferation nowadays. Many representative algorithms made great efforts to discover \ldots{}", acknowledgement = ack-nhfb, articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zou:2023:LAC, author = "Jie Zou and Jimmy Huang and Zhaochun Ren and Evangelos Kanoulas", title = "Learning to Ask: Conversational Product Search via Representation Learning", journal = j-TOIS, volume = "41", number = "2", pages = "45:1--45:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3555371", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3555371", abstract = "Online shopping platforms, such as Amazon and AliExpress, are increasingly prevalent in society, helping customers purchase products conveniently. With recent progress in natural language processing, researchers and practitioners shift their focus from \ldots{}", acknowledgement = ack-nhfb, articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2023:FUM, author = "Qi Liu and Jinze Wu and Zhenya Huang and Hao Wang and Yuting Ning and Ming Chen and Enhong Chen and Jinfeng Yi and Bowen Zhou", title = "Federated User Modeling from Hierarchical Information", journal = j-TOIS, volume = "41", number = "2", pages = "46:1--46:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3560485", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3560485", abstract = "The generation of large amounts of personal data provides data centers with sufficient resources to mine idiosyncrasy from private records. User modeling has long been a fundamental task with the goal of capturing the latent characteristics of users from \ldots{}", acknowledgement = ack-nhfb, articleno = "46", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2023:MOO, author = "Haolun Wu and Chen Ma and Bhaskar Mitra and Fernando Diaz and Xue Liu", title = "A Multi-Objective Optimization Framework for Multi-Stakeholder Fairness-Aware Recommendation", journal = j-TOIS, volume = "41", number = "2", pages = "47:1--47:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564285", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564285", abstract = "Nowadays, most online services are hosted on multi-stakeholder marketplaces, where consumers and producers may have different objectives. Conventional recommendation systems, however, mainly focus on maximizing consumers' satisfaction by recommending the \ldots{}", acknowledgement = ack-nhfb, articleno = "47", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lu:2023:UPR, author = "Hongyu Lu and Weizhi Ma and Yifan Wang and Min Zhang and Xiang Wang and Yiqun Liu and Tat-Seng Chua and Shaoping Ma", title = "User Perception of Recommendation Explanation: Are Your Explanations What Users Need?", journal = j-TOIS, volume = "41", number = "2", pages = "48:1--48:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3565480", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3565480", abstract = "As recommender systems become increasingly important in daily human decision-making, users are demanding convincing explanations to understand why they get the specific recommendation results. Although a number of explainable recommender systems have \ldots{}", acknowledgement = ack-nhfb, articleno = "48", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Rizzo:2023:RMT, author = "Stefano Giovanni Rizzo and Matteo Brucato and Danilo Montesi", title = "Ranking Models for the Temporal Dimension of Text", journal = j-TOIS, volume = "41", number = "2", pages = "49:1--49:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3565481", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3565481", abstract = "Temporal features of text have been shown to improve clustering and organization of documents, text classification, visualization, and ranking. Temporal ranking models consider the temporal expressions found in text (e.g., ``in 2021'' or ``last year'') as \ldots{}", acknowledgement = ack-nhfb, articleno = "49", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fei:2023:RAB, author = "Hao Fei and Tat-Seng Chua and Chenliang Li and Donghong Ji and Meishan Zhang and Yafeng Ren", title = "On the Robustness of Aspect-based Sentiment Analysis: Rethinking Model, Data, and Training", journal = j-TOIS, volume = "41", number = "2", pages = "50:1--50:??", month = apr, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564281", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Mon May 1 07:56:18 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564281", abstract = "Aspect-based sentiment analysis (ABSA) aims at automatically inferring the specific sentiment polarities toward certain aspects of products or services behind the social media texts or reviews, which has been a fundamental application to the real-world \ldots{}", acknowledgement = ack-nhfb, articleno = "50", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yin:2023:TRSa, author = "Hongzhi Yin and Yizhou Sun and Guandong Xu and Evangelos Kanoulas", title = "Trustworthy Recommendation and Search: Introduction to the Special Issue --- {Part 1}", journal = j-TOIS, volume = "41", number = "3", pages = "51:1--51:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3579995", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3579995", acknowledgement = ack-nhfb, articleno = "51", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2023:SFR, author = "Yifan Wang and Weizhi Ma and Min Zhang and Yiqun Liu and Shaoping Ma", title = "A Survey on the Fairness of Recommender Systems", journal = j-TOIS, volume = "41", number = "3", pages = "52:1--52:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3547333", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3547333", abstract = "Recommender systems are an essential tool to relieve the information overload challenge and play an important role in people's daily lives. Since recommendations \ldots{}", acknowledgement = ack-nhfb, articleno = "52", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2023:ACF, author = "Xiangnan He and Yang Zhang and Fuli Feng and Chonggang Song and Lingling Yi and Guohui Ling and Yongdong Zhang", title = "Addressing Confounding Feature Issue for Causal Recommendation", journal = j-TOIS, volume = "41", number = "3", pages = "53:1--53:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3559757", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3559757", abstract = "In recommender systems, some features directly affect whether an interaction would happen, making the happened interactions not necessarily indicate user \ldots{}", acknowledgement = ack-nhfb, articleno = "53", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2023:EQB, author = "Lei Zhu and Tianshi Wang and Jingjing Li and Zheng Zhang and Jialie Shen and Xinhua Wang", title = "Efficient Query-based Black-box Attack against Cross-modal Hashing Retrieval", journal = j-TOIS, volume = "41", number = "3", pages = "54:1--54:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3559758", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/hash.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3559758", abstract = "Deep cross-modal hashing retrieval models inherit the vulnerability of deep neural networks. They are vulnerable to adversarial attacks, especially for the form of subtle perturbations to the inputs. Although many adversarial attack methods have been proposed to handle the robustness of hashing retrieval models, they still suffer from two problems: (1) Most of them are based on the white-box settings, which is usually unrealistic in practical application. (2) Iterative optimization for the generation of adversarial examples in them results in heavy computation. To address these problems, we propose an Efficient Query-based Black-Box Attack (EQB$^2$A) against deep cross-modal hashing retrieval, which can efficiently generate adversarial examples for the black-box attack. Specifically, by sending a few query requests to the attacked retrieval system, the cross-modal retrieval model stealing is performed based on the neighbor relationship between the retrieved results and the query, thus obtaining the knockoffs to substitute the attacked system. A multi-modal knockoffs-driven adversarial generation is proposed to achieve efficient adversarial example generation. While the entire network training converges, EQB2A can efficiently generate adversarial examples by forward-propagation with only given benign images. Experiments show that EQB2A achieves superior attacking performance under the black-box setting.", acknowledgement = ack-nhfb, articleno = "54", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2023:MPB, author = "Zhongzhou Liu and Yuan Fang and Min Wu", title = "Mitigating Popularity Bias for Users and Items with Fairness-centric Adaptive Recommendation", journal = j-TOIS, volume = "41", number = "3", pages = "55:1--55:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564286", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564286", abstract = "Recommendation systems are popular in many domains. Researchers usually focus on the effectiveness of recommendation (e.g., precision) but neglect the \ldots{}", acknowledgement = ack-nhfb, articleno = "55", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dong:2023:DPD, author = "Xue Dong and Xuemeng Song and Na Zheng and Yinwei Wei and Zhongzhou Zhao", title = "Dual Preference Distribution Learning for Item Recommendation", journal = j-TOIS, volume = "41", number = "3", pages = "56:1--56:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3565798", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3565798", abstract = "Recommender systems can automatically recommend users with items that they probably like. The goal of them is to model the user-item interaction by \ldots{}", acknowledgement = ack-nhfb, articleno = "56", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xin:2023:UBL, author = "Xin Xin and Jiyuan Yang and Hanbing Wang and Jun Ma and Pengjie Ren and Hengliang Luo and Xinlei Shi and Zhumin Chen and Zhaochun Ren", title = "On the User Behavior Leakage from Recommender System Exposure", journal = j-TOIS, volume = "41", number = "3", pages = "57:1--57:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3568954", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3568954", abstract = "Modern recommender systems are trained to predict users' potential future interactions from users' historical behavior data. During the interaction process, despite \ldots{}", acknowledgement = ack-nhfb, articleno = "57", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Thanh:2023:PGB, author = "Toan Nguyen Thanh and Nguyen Duc Khang Quach and Thanh Tam Nguyen and Thanh Trung Huynh and Viet Hung Vu and Phi Le Nguyen and Jun Jo and Quoc Viet Hung Nguyen", title = "Poisoning {GNN}-based Recommender Systems with Generative Surrogate-based Attacks", journal = j-TOIS, volume = "41", number = "3", pages = "58:1--58:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3567420", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3567420", abstract = "With recent advancements in graph neural networks (GNN), GNN-based recommender systems (gRS) have achieved remarkable success in the past few years. \ldots{}", acknowledgement = ack-nhfb, articleno = "58", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ye:2023:TRN, author = "Haibo Ye and Xinjie Li and Yuan Yao and Hanghang Tong", title = "Towards Robust Neural Graph Collaborative Filtering via Structure Denoising and Embedding Perturbation", journal = j-TOIS, volume = "41", number = "3", pages = "59:1--59:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3568396", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3568396", abstract = "Neural graph collaborative filtering has received great recent attention due to its power of encoding the high-order neighborhood via the backbone \ldots{}", acknowledgement = ack-nhfb, articleno = "59", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2023:SID, author = "Ziqian Chen and Fei Sun and Yifan Tang and Haokun Chen and Jinyang Gao and Bolin Ding", title = "Studying the Impact of Data Disclosure Mechanism in Recommender Systems via Simulation", journal = j-TOIS, volume = "41", number = "3", pages = "60:1--60:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3569452", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3569452", abstract = "Recently, privacy issues in web services that rely on users' personal data have raised great attention. Despite that recent regulations force companies to offer choices \ldots{}", acknowledgement = ack-nhfb, articleno = "60", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Oosterhuis:2023:DRE, author = "Harrie Oosterhuis", title = "Doubly Robust Estimation for Correcting Position Bias in Click Feedback for Unbiased Learning to Rank", journal = j-TOIS, volume = "41", number = "3", pages = "61:1--61:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3569453", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3569453", abstract = "Clicks on rankings suffer from position bias: generally items on lower ranks are less likely to be examined-and thus clicked-by users, in spite of their actual preferences \ldots{}", acknowledgement = ack-nhfb, articleno = "61", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:PRF, author = "Hang Li and Ahmed Mourad and Shengyao Zhuang and Bevan Koopman and Guido Zuccon", title = "Pseudo Relevance Feedback with Deep Language Models and Dense Retrievers: Successes and Pitfalls", journal = j-TOIS, volume = "41", number = "3", pages = "62:1--62:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3570724", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3570724", abstract = "Pseudo Relevance Feedback (PRF) is known to improve the effectiveness of bag-of-words retrievers. At the same time, deep language models have been shown \ldots{}", acknowledgement = ack-nhfb, articleno = "62", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2023:PHG, author = "Naicheng Guo and Xiaolei Liu and Shaoshuai Li and Qiongxu Ma and Kaixin Gao and Bing Han and Lin Zheng and Sheng Guo and Xiaobo Guo", title = "{Poincar{\'e}} Heterogeneous Graph Neural Networks for Sequential Recommendation", journal = j-TOIS, volume = "41", number = "3", pages = "63:1--63:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3568395", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3568395", abstract = "Sequential recommendation (SR) learns users' preferences by capturing the sequential patterns from users' behaviors evolution. As discussed in many \ldots{}", acknowledgement = ack-nhfb, articleno = "63", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cai:2023:UCS, author = "Desheng Cai and Shengsheng Qian and Quan Fang and Jun Hu and Changsheng Xu", title = "User Cold-Start Recommendation via Inductive Heterogeneous Graph Neural Network", journal = j-TOIS, volume = "41", number = "3", pages = "64:1--64:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3560487", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3560487", abstract = "Recently, user cold-start recommendations have attracted a lot of attention from industry and academia. In user cold-start recommendation systems, the user \ldots{}", acknowledgement = ack-nhfb, articleno = "64", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Imran:2023:RRE, author = "Mubashir Imran and Hongzhi Yin and Tong Chen and Quoc Viet Hung Nguyen and Alexander Zhou and Kai Zheng", title = "{ReFRS}: Resource-efficient Federated Recommender System for Dynamic and Diversified User Preferences", journal = j-TOIS, volume = "41", number = "3", pages = "65:1--65:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3560486", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3560486", abstract = "Owing to its nature of scalability and privacy by design, federated learning (FL) has received increasing interest in decentralized deep learning. FL has also \ldots{}", acknowledgement = ack-nhfb, articleno = "65", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Long:2023:DCL, author = "Jing Long and Tong Chen and Quoc Viet Hung Nguyen and Hongzhi Yin", title = "Decentralized Collaborative Learning Framework for Next {POI} Recommendation", journal = j-TOIS, volume = "41", number = "3", pages = "66:1--66:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3555374", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3555374", abstract = "Next Point-of-Interest (POI) recommendation has become an indispensable functionality in Location-based Social Networks (LBSNs) due \ldots{}", acknowledgement = ack-nhfb, articleno = "66", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2023:BDR, author = "Jiawei Chen and Hande Dong and Xiang Wang and Fuli Feng and Meng Wang and Xiangnan He", title = "Bias and Debias in Recommender System: a Survey and Future Directions", journal = j-TOIS, volume = "41", number = "3", pages = "67:1--67:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564284", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564284", abstract = "While recent years have witnessed a rapid growth of research papers on recommender system (RS), most of the papers focus on inventing machine learning \ldots{}", acknowledgement = ack-nhfb, articleno = "67", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Song:2023:SPF, author = "Haoyu Song and Wei-Nan Zhang and Kaiyan Zhang and Ting Liu", title = "A Stack-Propagation Framework for Low-Resource Personalized Dialogue Generation", journal = j-TOIS, volume = "41", number = "3", pages = "68:1--68:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3563389", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3563389", abstract = "With the resurgent interest in building open-domain dialogue systems, the dialogue generation task has attracted increasing attention over the past few years. \ldots{}", acknowledgement = ack-nhfb, articleno = "68", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shen:2023:RWC, author = "Yanyan Shen and Lifan Zhao and Weiyu Cheng and Zibin Zhang and Wenwen Zhou and Lin Kangyi", title = "{RESUS}: Warm-up Cold Users via Meta-learning Residual User Preferences in {CTR} Prediction", journal = j-TOIS, volume = "41", number = "3", pages = "69:1--69:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564283", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564283", abstract = "Click-through Rate (CTR) prediction on cold users is a challenging task in recommender systems. Recent researches have resorted to meta-learning to tackle the \ldots{}", acknowledgement = ack-nhfb, articleno = "69", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liang:2023:ETA, author = "Bi Liang and Xiangwu Meng and Yujie Zhang", title = "Exploring Time-aware Multi-pattern Group Venue Recommendation in {LBSNs}", journal = j-TOIS, volume = "41", number = "3", pages = "70:1--70:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564280", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564280", abstract = "Location-based social networks (LBSNs) have become a popular platform for users to share their activities with friends and families, which provide abundant \ldots{}", acknowledgement = ack-nhfb, articleno = "70", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2023:ITB, author = "Muyang Ma and Pengjie Ren and Zhumin Chen and Zhaochun Ren and Huasheng Liang and Jun Ma and Maarten {De Rijke}", title = "Improving Transformer-based Sequential Recommenders through Preference Editing", journal = j-TOIS, volume = "41", number = "3", pages = "71:1--71:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3564282", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3564282", abstract = "One of the key challenges in sequential recommendation is how to extract and represent user preferences. Traditional methods rely solely on predicting \ldots{}", acknowledgement = ack-nhfb, articleno = "71", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Han:2023:DDA, author = "Lei Han and Tianwa Chen and Gianluca Demartini and Marta Indulska and Shazia Sadiq", title = "A Data-Driven Analysis of Behaviors in Data Curation Processes", journal = j-TOIS, volume = "41", number = "3", pages = "72:1--72:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3567419", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3567419", abstract = "Understanding how data workers interact with data, and various pieces of information related to data preparation, is key to designing systems that can better \ldots{}", acknowledgement = ack-nhfb, articleno = "72", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:PSK, author = "Minghan Li and Diana Nicoleta Popa and Johan Chagnon and Yagmur Gizem Cinar and Eric Gaussier", title = "The Power of Selecting Key Blocks with Local Pre-ranking for Long Document Information Retrieval", journal = j-TOIS, volume = "41", number = "3", pages = "73:1--73:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3568394", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3568394", abstract = "On a wide range of natural language processing and information retrieval tasks, transformer-based models, particularly pre-trained language models like \ldots{}", acknowledgement = ack-nhfb, articleno = "73", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2023:GNP, author = "Siwei Liu and Zaiqiao Meng and Craig Macdonald and Iadh Ounis", title = "Graph Neural Pre-training for Recommendation with Side Information", journal = j-TOIS, volume = "41", number = "3", pages = "74:1--74:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3568953", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3568953", abstract = "Leveraging the side information associated with entities (i.e., users and items) to enhance recommendation systems has been widely recognized as an essential \ldots{}", acknowledgement = ack-nhfb, articleno = "74", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ji:2023:CSD, author = "Yitong Ji and Aixin Sun and Jie Zhang and Chenliang Li", title = "A Critical Study on Data Leakage in Recommender System Offline Evaluation", journal = j-TOIS, volume = "41", number = "3", pages = "75:1--75:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3569930", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3569930", abstract = "Recommender models are hard to evaluate, particularly under offline setting. In this article, we provide a comprehensive and critical analysis of the data leakage \ldots{}", acknowledgement = ack-nhfb, articleno = "75", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shao:2023:URJ, author = "Yunqiu Shao and Yueyue Wu and Yiqun Liu and Jiaxin Mao and Shaoping Ma", title = "Understanding Relevance Judgments in Legal Case Retrieval", journal = j-TOIS, volume = "41", number = "3", pages = "76:1--76:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3569929", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3569929", abstract = "Legal case retrieval, which aims to retrieve relevant cases given a query case, has drawn increasing research attention in recent years. While much research has worked \ldots{}", acknowledgement = ack-nhfb, articleno = "76", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2023:UMT, author = "Yang Deng and Wenxuan Zhang and Weiwen Xu and Wenqiang Lei and Tat-Seng Chua and Wai Lam", title = "A Unified Multi-task Learning Framework for Multi-goal Conversational Recommender Systems", journal = j-TOIS, volume = "41", number = "3", pages = "77:1--77:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3570640", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3570640", abstract = "Recent years witnessed several advances in developing multi-goal conversational recommender systems (MG-CRS) that can proactively attract users' interests \ldots{}", acknowledgement = ack-nhfb, articleno = "77", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2023:MUR, author = "Yu Zhao and Qiang Xu and Ying Zou and Wei Li", title = "Modeling User Reviews through {Bayesian} Graph Attention Networks for Recommendation", journal = j-TOIS, volume = "41", number = "3", pages = "78:1--78:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3570500", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3570500", abstract = "Recommender systems relieve users from cognitive overloading by predicting preferred items for users. Due to the complexity of interactions between users and \ldots{}", acknowledgement = ack-nhfb, articleno = "78", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yan:2023:AHP, author = "Ming Yan and Haiyang Xu and Chenliang Li and Junfeng Tian and Bin Bi and Wei Wang and Xianzhe Xu and Ji Zhang and Songfang Huang and Fei Huang and Luo Si and Rong Jin", title = "Achieving Human Parity on Visual Question Answering", journal = j-TOIS, volume = "41", number = "3", pages = "79:1--79:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3572833", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3572833", abstract = "The Visual Question Answering (VQA) task utilizes both visual image and language analysis to answer a textual question with respect to an image. It has been a \ldots{}", acknowledgement = ack-nhfb, articleno = "79", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:PAG, author = "Yakun Li and Lei Hou and Juanzi Li", title = "Preference-aware Graph Attention Networks for Cross-Domain Recommendations with Collaborative Knowledge Graph", journal = j-TOIS, volume = "41", number = "3", pages = "80:1--80:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3576921", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3576921", abstract = "Knowledge graphs (KGs) can provide users with semantic information and relations among numerous entities and nodes, which can greatly facilitate the \ldots{}", acknowledgement = ack-nhfb, articleno = "80", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:RGB, author = "Yi Zhang and Yiwen Zhang and Dengcheng Yan and Shuiguang Deng and Yun Yang", title = "Revisiting Graph-based Recommender Systems from the Perspective of Variational Auto-Encoder", journal = j-TOIS, volume = "41", number = "3", pages = "81:1--81:??", month = jul, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3573385", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 9 08:43:56 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3573385", abstract = "Graph-based recommender system has attracted widespread attention and produced a series of research results. Because of the powerful high-order connection \ldots{}", acknowledgement = ack-nhfb, articleno = "81", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yin:2023:TRSb, author = "Hongzhi Yin and Yizhou Sun and Guandong Xu and Evangelos Kanoulas", title = "Trustworthy Recommendation and Search: Introduction to the Special Section --- {Part 2}", journal = j-TOIS, volume = "41", number = "4", pages = "82:1--82:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3604776", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3604776", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "82", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhou:2023:EHT, author = "Yuchen Zhou and Yanan Cao and Yanmin Shang and Chuan Zhou and Shirui Pan and Zheng Lin and Qian Li", title = "Explainable Hyperbolic Temporal Point Process for User-Item Interaction Sequence Generation", journal = j-TOIS, volume = "41", number = "4", pages = "83:1--83:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3570501", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3570501", abstract = "Recommender systems which captures dynamic user interest based on time-ordered user-item interactions plays a critical role in the real-world. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "83", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deffayet:2023:ERC, author = "Romain Deffayet and Jean-Michel Renders and Maarten de Rijke", title = "Evaluating the Robustness of Click Models to Policy Distributional Shift", journal = j-TOIS, volume = "41", number = "4", pages = "84:1--84:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3569086", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3569086", abstract = "Many click models have been proposed to interpret logs of natural interactions with search engines and extract unbiased information for evaluation or \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "84", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2023:DRL, author = "Xiaobo Guo and Shaoshuai Li and Naicheng Guo and Jiangxia Cao and Xiaolei Liu and Qiongxu Ma and Runsheng Gan and Yunan Zhao", title = "Disentangled Representations Learning for Multi-target Cross-domain Recommendation", journal = j-TOIS, volume = "41", number = "4", pages = "85:1--85:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3572835", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3572835", abstract = "Data sparsity has been a long-standing issue for accurate and trustworthy recommendation systems (RS). To alleviate the problem, many researchers pay \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "85", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xue:2023:LDV, author = "Lyuxin Xue and Deqing Yang and Shuoyao Zhai and Yuxin Li and Yanghua Xiao", title = "Learning Dual-view User Representations for Enhanced Sequential Recommendation", journal = j-TOIS, volume = "41", number = "4", pages = "86:1--86:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3572028", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3572028", abstract = "Sequential recommendation (SR) aims to predict a user's next interacted item given his/her historical interactions. Most existing sequential recommendation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "86", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2023:VGL, author = "Senrong Xu and Liangyue Li and Zenan Li and Yuan Yao and Feng Xu and Zulong Chen and Quan Lu and Hanghang Tong", title = "On the Vulnerability of Graph Learning-based Collaborative Filtering", journal = j-TOIS, volume = "41", number = "4", pages = "87:1--87:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3572834", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3572834", abstract = "Graph learning-based collaborative filtering (GLCF), which is built upon the message-passing mechanism of graph neural networks (GNNs), has received great recent \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "87", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Leonhardt:2023:EEI, author = "Jurek Leonhardt and Koustav Rudra and Avishek Anand", title = "Extractive Explanations for Interpretable Text Ranking", journal = j-TOIS, volume = "41", number = "4", pages = "88:1--88:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3576924", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3576924", abstract = "Neural document ranking models perform impressively well due to superior language understanding gained from pre-training tasks. However, due to their \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "88", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2023:PPB, author = "Chen Wu and Ruqing Zhang and Jiafeng Guo and Maarten {De Rijke} and Yixing Fan and Xueqi Cheng", title = "{PRADA}: Practical Black-box Adversarial Attacks against Neural Ranking Models", journal = j-TOIS, volume = "41", number = "4", pages = "89:1--89:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3576923", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3576923", abstract = "Neural ranking models (NRMs) have shown remarkable success in recent years, especially with pre-trained language models. However, deep neural models are \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "89", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:LLF, author = "Honglei Zhang and Fangyuan Luo and Jun Wu and Xiangnan He and Yidong Li", title = "{LightFR}: Lightweight Federated Recommendation with Privacy-preserving Matrix Factorization", journal = j-TOIS, volume = "41", number = "4", pages = "90:1--90:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3578361", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3578361", abstract = "Federated recommender system (FRS), which enables many local devices to train a shared model jointly without transmitting local raw data, has become a prevalent \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "90", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2023:ERS, author = "Liyang He and Zhenya Huang and Enhong Chen and Qi Liu and Shiwei Tong and Hao Wang and Defu Lian and Shijin Wang", title = "An Efficient and Robust Semantic Hashing Framework for Similar Text Search", journal = j-TOIS, volume = "41", number = "4", pages = "91:1--91:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3570725", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3570725", abstract = "Similar text search aims to find texts relevant to a given query from a database, which is fundamental in many information retrieval applications, such as \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "91", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:TAI, author = "Qiming Li and Zhao Zhang and Fuzhen Zhuang and Yongjun Xu and Chao Li", title = "Topic-aware Intention Network for Explainable Recommendation with Knowledge Enhancement", journal = j-TOIS, volume = "41", number = "4", pages = "92:1--92:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3579993", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3579993", abstract = "Recently, recommender systems based on knowledge graphs (KGs) have become a popular research direction. Graph neural network (GNN) is the key \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "92", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Meng:2023:RNT, author = "Qing Meng and Hui Yan and Bo Liu and Xiangguo Sun and Mingrui Hu and Jiuxin Cao", title = "Recognize News Transition from Collective Behavior for News Recommendation", journal = j-TOIS, volume = "41", number = "4", pages = "93:1--93:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3578362", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3578362", abstract = "In the news recommendation, users are overwhelmed by thousands of news daily, which makes the users' behavior data have high sparsity. Therefore, only \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "93", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2023:QRM, author = "Lingzhi Wang and Xingshan Zeng and Kam-Fai Wong", title = "Quotation Recommendation for Multi-party Online Conversations Based on Semantic and Topic Fusion", journal = j-TOIS, volume = "41", number = "4", pages = "94:1--94:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3594633", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3594633", abstract = "Quotations are crucial for successful explanations and persuasions in interpersonal communications. However, finding what to quote in a \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "94", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2023:AAT, author = "Yan Zhao and Liwei Deng and Kai Zheng", title = "{AdaTaskRec}: an Adaptive Task Recommendation Framework in Spatial Crowdsourcing", journal = j-TOIS, volume = "41", number = "4", pages = "95:1--95:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3593582", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3593582", abstract = "Spatial crowdsourcing is one of the prime movers for the orchestration of location-based tasks, and task recommendation is a crucial means to help workers \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "95", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mackenzie:2023:EDT, author = "Joel Mackenzie and Andrew Trotman and Jimmy Lin", title = "Efficient Document-at-a-time and Score-at-a-time Query Evaluation for Learned Sparse Representations", journal = j-TOIS, volume = "41", number = "4", pages = "96:1--96:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3576922", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3576922", abstract = "Researchers have had much recent success with ranking models based on so-called learned sparse representations generated by transformers. One crucial \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "96", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:MLA, author = "Xinyue Zhang and Jingjing Li and Hongzu Su and Lei Zhu and Heng Tao Shen", title = "Multi-level Attention-based Domain Disentanglement for {BCDR}", journal = j-TOIS, volume = "41", number = "4", pages = "97:1--97:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3576925", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3576925", abstract = "Cross-domain recommendation aims to exploit heterogeneous information from a data-sufficient domain (source domain) to transfer knowledge to a \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "97", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2023:LRU, author = "Jiarui Qin and Weinan Zhang and Rong Su and Zhirong Liu and Weiwen Liu and Guangpeng Zhao and Hao Li and Ruiming Tang and Xiuqiang He and Yong Yu", title = "Learning to Retrieve User Behaviors for Click-through Rate Estimation", journal = j-TOIS, volume = "41", number = "4", pages = "98:1--98:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3579354", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3579354", abstract = "Click-through rate (CTR) estimation plays a crucial role in modern online personalization services. It is essential to capture users' drifting interests by modeling \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "98", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yao:2023:OAP, author = "Zijun Yao and Bin Liu and Fei Wang and Daby Sow and Ying Li", title = "Ontology-aware Prescription Recommendation in Treatment Pathways Using Multi-evidence Healthcare Data", journal = j-TOIS, volume = "41", number = "4", pages = "99:1--99:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3579994", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3579994", abstract = "For care of chronic diseases (e.g., depression, diabetes, hypertension), it is critical to identify effective treatment pathways that aim to promptly update the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "99", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Somanchi:2023:EUH, author = "Sriram Somanchi and Ahmed Abbasi and Ken Kelley and David Dobolyi and Ted Tao Yuan", title = "Examining User Heterogeneity in Digital Experiments", journal = j-TOIS, volume = "41", number = "4", pages = "100:1--100:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3578931", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3578931", abstract = "Digital experiments are routinely used to test the value of a treatment relative to a status-quo control setting-for instance, a new search relevance algorithm for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "100", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zheng:2023:ADR, author = "Ruiqi Zheng and Liang Qu and Bin Cui and Yuhui Shi and Hongzhi Yin", title = "{AutoML} for Deep Recommender Systems: a Survey", journal = j-TOIS, volume = "41", number = "4", pages = "101:1--101:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3579355", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3579355", abstract = "Recommender systems play a significant role in information filtering and have been utilized in different scenarios, such as e-commerce and social media. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "101", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xia:2023:EDS, author = "Xin Xia and Junliang Yu and Qinyong Wang and Chaoqun Yang and Nguyen Quoc Viet Hung and Hongzhi Yin", title = "Efficient On-Device Session-Based Recommendation", journal = j-TOIS, volume = "41", number = "4", pages = "102:1--102:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3580364", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3580364", abstract = "On-device session-based recommendation systems have been achieving increasing attention on account of the low energy/resource consumption and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "102", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:PPL, author = "Lei Li and Yongfeng Zhang and Li Chen", title = "Personalized Prompt Learning for Explainable Recommendation", journal = j-TOIS, volume = "41", number = "4", pages = "103:1--103:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3580488", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3580488", abstract = "Providing user-understandable explanations to justify recommendations could help users better understand the recommended items, increase the system's ease of use, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "103", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cui:2023:FGI, author = "Jiajun Cui and Zeyuan Chen and Aimin Zhou and Jianyong Wang and Wei Zhang", title = "Fine-Grained Interaction Modeling with Multi-Relational Transformer for Knowledge Tracing", journal = j-TOIS, volume = "41", number = "4", pages = "104:1--104:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3580595", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3580595", abstract = "Knowledge tracing, the goal of which is predicting students' future performance given their past question response sequences to trace their knowledge states, is \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "104", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cheng:2023:CDM, author = "Zifeng Cheng and Zhiwei Jiang and Yafeng Yin and Cong Wang and Shiping Ge and Qing Gu", title = "A Consistent Dual-{MRC} Framework for Emotion-cause Pair Extraction", journal = j-TOIS, volume = "41", number = "4", pages = "105:1--105:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3558548", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3558548", abstract = "Emotion-cause pair extraction (ECPE) is a recently proposed task that aims to extract the potential clause pairs of emotions and its corresponding causes in a \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "105", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yi:2023:MAA, author = "Jing Yi and Xubin Ren and Zhenzhong Chen", title = "Multi-auxiliary Augmented Collaborative Variational Auto-encoder for Tag Recommendation", journal = j-TOIS, volume = "41", number = "4", pages = "106:1--106:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3578932", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3578932", abstract = "Recommending appropriate tags to items can facilitate content organization, retrieval, consumption, and other applications, where hybrid tag recommender systems \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "106", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhou:2023:EMV, author = "Kun Zhou and Hui Wang and Ji-rong Wen and Wayne Xin Zhao", title = "Enhancing Multi-View Smoothness for Sequential Recommendation Models", journal = j-TOIS, volume = "41", number = "4", pages = "107:1--107:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3582495", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3582495", abstract = "Sequential recommendation models aim to predict the interested items to a user based on his historical behaviors. To train sequential recommenders, implicit \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "107", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2023:BSI, author = "Dugang Liu and Pengxiang Cheng and Zinan Lin and Xiaolian Zhang and Zhenhua Dong and Rui Zhang and Xiuqiang He and Weike Pan and Zhong Ming", title = "Bounding System-Induced Biases in Recommender Systems with a Randomized Dataset", journal = j-TOIS, volume = "41", number = "4", pages = "108:1--108:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3582002", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3582002", abstract = "Debiased recommendation with a randomized dataset has shown very promising results in mitigating system-induced biases. However, it still \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "108", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dusart:2023:THS, author = "Alexis Dusart and Karen Pinel-Sauvagnat and Gilles Hubert", title = "{TSSuBERT}: How to Sum Up Multiple Years of Reading in a Few Tweets", journal = j-TOIS, volume = "41", number = "4", pages = "109:1--109:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3581786", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3581786", abstract = "The development of deep neural networks and the emergence of pre-trained language models such as BERT allow to increase performance on many NLP tasks. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "109", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2023:DRF, author = "Sheng-Chieh Lin and Jimmy Lin", title = "A Dense Representation Framework for Lexical and Semantic Matching", journal = j-TOIS, volume = "41", number = "4", pages = "110:1--110:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3582426", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3582426", abstract = "Lexical and semantic matching capture different successful approaches to text retrieval and the fusion of their results has proven to be more effective and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "110", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Si:2023:ERS, author = "Zihua Si and Zhongxiang Sun and Xiao Zhang and Jun Xu and Yang Song and Xiaoxue Zang and Ji-Rong Wen", title = "Enhancing Recommendation with Search Data in a Causal Learning Manner", journal = j-TOIS, volume = "41", number = "4", pages = "111:1--111:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3582425", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3582425", abstract = "Recommender systems are currently widely used in various applications helping people filter information. Existing models always embed the rich information for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "111", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2023:TTG, author = "Ronghui Xu and Meng Chen and Yongshun Gong and Yang Liu and Xiaohui Yu and Liqiang Nie", title = "{TME}: Tree-guided Multi-task Embedding Learning towards Semantic Venue Annotation", journal = j-TOIS, volume = "41", number = "4", pages = "112:1--112:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3582553", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3582553", abstract = "The prevalence of location-based services has generated a deluge of check-ins, enabling the task of human mobility understanding. Among the various \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "112", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2023:CLL, author = "Han Zhang and Zhicheng Dou and Yutao Zhu and Ji-Rong Wen", title = "Contrastive Learning for Legal Judgment Prediction", journal = j-TOIS, volume = "41", number = "4", pages = "113:1--113:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3580489", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3580489", abstract = "Legal judgment prediction (LJP) is a fundamental task of legal artificial intelligence. It aims to automatically predict the judgment results of legal \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "113", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2023:DRU, author = "Mengyue Yang and Guohao Cai and Furui Liu and Jiarui Jin and Zhenhua Dong and Xiuqiang He and Jianye Hao and Weiqi Shao and Jun Wang and Xu Chen", title = "Debiased Recommendation with User Feature Balancing", journal = j-TOIS, volume = "41", number = "4", pages = "114:1--114:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3580594", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3580594", abstract = "Debiased recommendation has recently attracted increasing attention from both industry and academic communities. Traditional models mostly rely on \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "114", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Feng:2023:LMT, author = "Jiazhan Feng and Chongyang Tao and Xueliang Zhao and Dongyan Zhao", title = "Learning Multi-turn Response Selection in Grounded Dialogues with Reinforced Knowledge and Context Distillation", journal = j-TOIS, volume = "41", number = "4", pages = "115:1--115:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3584701", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3584701", abstract = "Recently, knowledge-grounded dialogue systems have gained increasing attention. Great efforts have been made to build response matching models where \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "115", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2023:NBR, author = "Ming Li and Sami Jullien and Mozhdeh Ariannezhad and Maarten de Rijke", title = "A Next Basket Recommendation Reality Check", journal = j-TOIS, volume = "41", number = "4", pages = "116:1--116:??", month = oct, year = "2023", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3587153", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Sep 20 08:21:57 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3587153", abstract = "The goal of a next basket recommendation (NBR) system is to recommend items for the next basket for a user, based on the sequence of their prior baskets. We \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "116", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wei:2024:NAS, author = "Lanning Wei and Huan Zhao and Zhiqiang He and Quanming Yao", title = "Neural Architecture Search for {GNN}-Based Graph Classification", journal = j-TOIS, volume = "42", number = "1", pages = "1:1--1:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3584945", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3584945", abstract = "Graph classification is an important problem with applications across many domains, for which graph neural networks (GNNs) have been state-of-the-art (SOTA) methods. In the literature, to adopt GNNs for the graph classification task, there are two groups \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{McGregor:2024:SRC, author = "Molly McGregor and Leif Azzopardi and Martin Halvey", title = "A Systematic Review of Cost, Effort, and Load Research in Information Search and Retrieval, 1972--2020", journal = j-TOIS, volume = "42", number = "1", pages = "2:1--2:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3583069", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3583069", abstract = "During the information search and retrieval (ISR) process, user-system interactions such as submitting queries, examining results, and engaging with information impose some degree of demand on the user's resources. Within ISR, these demands are well \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2024:GBP, author = "Hongyan Xu and Qiyao Peng and Hongtao Liu and Yueheng Sun and Wenjun Wang", title = "Group-Based Personalized News Recommendation with Long- and Short-Term Fine-Grained Matching", journal = j-TOIS, volume = "42", number = "1", pages = "3:1--3:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3584946", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3584946", abstract = "Personalized news recommendation aims to help users find news content they prefer, which has attracted increasing attention recently. There are two core issues in news recommendation: learning news representation and matching candidate news with user \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:RSM, author = "Jin Zhang and Xinrui Li and Liye Wang", title = "A Review Selection Method Based on Consumer Decision Phases in E-commerce", journal = j-TOIS, volume = "42", number = "1", pages = "4:1--4:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3587265", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3587265", abstract = "A valuable small subset strategically selected from massive online reviews is beneficial to improve consumers' decision-making efficiency in e-commerce. Existing review selection methods primarily concentrate on the informativeness of reviews and aim to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2024:FDF, author = "Yao Wu and Jian Cao and Guandong Xu", title = "{FASTER}: a Dynamic Fairness-assurance Strategy for Session-based Recommender Systems", journal = j-TOIS, volume = "42", number = "1", pages = "5:1--5:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3586993", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3586993", abstract = "When only users' preferences and interests are considered by a recommendation algorithm, it will lead to the severe long-tail problem over items. Therefore, the unfair exposure phenomenon of recommended items caused by this problem has attracted \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:CCP, author = "Xinhang Li and Zhaopeng Qiu and Jiacheng Jiang and Yong Zhang and Chunxiao Xing and Xian Wu", title = "Conditional Cross-Platform User Engagement Prediction", journal = j-TOIS, volume = "42", number = "1", pages = "6:1--6:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3589226", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3589226", abstract = "The bursting of media sharing platforms like TikTok, YouTube, and Kwai enables normal users to create and share content with worldwide audiences. The most popular YouTuber can attract up to 100 million followers. Since there are multiple popular platforms,. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Rad:2024:VNA, author = "Radin Hamidi Rad and Hossein Fani and Ebrahim Bagheri and Mehdi Kargar and Divesh Srivastava and Jaroslaw Szlichta", title = "A Variational Neural Architecture for Skill-based Team Formation", journal = j-TOIS, volume = "42", number = "1", pages = "7:1--7:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3589762", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3589762", abstract = "Team formation is concerned with the identification of a group of experts who have a high likelihood of effectively collaborating with each other to satisfy a collection of input skills. Solutions to this task have mainly adopted graph operations and at \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2024:MMA, author = "Liangliang He and Xiao Li and Pancheng Wang and Jintao Tang and Ting Wang", title = "{MAN}: Memory-augmented Attentive Networks for Deep Learning-based Knowledge Tracing", journal = j-TOIS, volume = "42", number = "1", pages = "8:1--8:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3589340", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3589340", abstract = "Knowledge Tracing (KT) is the task of modeling a learner's knowledge state to predict future performance in e-learning systems based on past performance. Deep learning-based methods, such as recurrent neural networks, memory-augmented neural networks, and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2024:TRD, author = "Hai Chen and Fulan Qian and Chang Liu and Yanping Zhang and Hang Su and Shu Zhao", title = "Training Robust Deep Collaborative Filtering Models via Adversarial Noise Propagation", journal = j-TOIS, volume = "42", number = "1", pages = "9:1--9:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3589000", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3589000", abstract = "The recommendation performance of deep collaborative filtering models drops sharply under imperceptible adversarial perturbations. Some methods promote the robustness of recommendation systems by adversarial training. However, these methods only study \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yan:2024:CRG, author = "Mingshi Yan and Zhiyong Cheng and Chen Gao and Jing Sun and Fan Liu and Fuming Sun and Haojie Li", title = "Cascading Residual Graph Convolutional Network for Multi-Behavior Recommendation", journal = j-TOIS, volume = "42", number = "1", pages = "10:1--10:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3587693", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3587693", abstract = "Multi-behavior recommendation exploits multiple types of user-item interactions, such as view and cart, to learn user preferences and has demonstrated to be an effective solution to alleviate the data sparsity problem faced by the traditional models that \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sakai:2024:VFE, author = "Tetsuya Sakai and Jin Young Kim and Inho Kang", title = "A Versatile Framework for Evaluating Ranked Lists in Terms of Group Fairness and Relevance", journal = j-TOIS, volume = "42", number = "1", pages = "11:1--11:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3589763", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3589763", abstract = "We present a simple and versatile framework for evaluating ranked lists in terms of Group Fairness and Relevance, in which the groups (i.e., possible attribute values) can be either nominal or ordinal in nature. First, we demonstrate that when our \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:CDR, author = "Wenjie Wang and Xinyu Lin and Liuhui Wang and Fuli Feng and Yunshan Ma and Tat-Seng Chua", title = "Causal Disentangled Recommendation against User Preference Shifts", journal = j-TOIS, volume = "42", number = "1", pages = "12:1--12:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3593022", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3593022", abstract = "Recommender systems easily face the issue of user preference shifts. User representations will become out-of-date and lead to inappropriate recommendations if user preference has shifted over time. To solve the issue, existing work focuses on learning \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:MMM, author = "Yazhou Zhang and Ao Jia and Bo Wang and Peng Zhang and Dongming Zhao and Pu Li and Yuexian Hou and Xiaojia Jin and Dawei Song and Jing Qin", title = "{M3GAT}: a Multi-modal, Multi-task Interactive Graph Attention Network for Conversational Sentiment Analysis and Emotion Recognition", journal = j-TOIS, volume = "42", number = "1", pages = "13:1--13:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3593583", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3593583", abstract = "Sentiment and emotion, which correspond to long-term and short-lived human feelings, are closely linked to each other, leading to the fact that sentiment analysis and emotion recognition are also two interdependent tasks in natural language processing \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gao:2024:CBF, author = "Chongming Gao and Shiqi Wang and Shijun Li and Jiawei Chen and Xiangnan He and Wenqiang Lei and Biao Li and Yuan Zhang and Peng Jiang", title = "{CIRS}: Bursting Filter Bubbles by Counterfactual Interactive Recommender System", journal = j-TOIS, volume = "42", number = "1", pages = "14:1--14:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3594871", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3594871", abstract = "While personalization increases the utility of recommender systems, it also brings the issue of filter bubbles. e.g., if the system keeps exposing and recommending the items that the user is interested in, it may also make the user feel bored and less \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2024:MCN, author = "Zhu Sun and Yu Lei and Lu Zhang and Chen Li and Yew-Soon Ong and Jie Zhang", title = "A Multi-channel Next {POI} Recommendation Framework with Multi-granularity Check-in Signals", journal = j-TOIS, volume = "42", number = "1", pages = "15:1--15:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3592789", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3592789", abstract = "Current study on next point-of-interest (POI) recommendation mainly explores user sequential transitions with the fine-grained individual-user POI check-in trajectories only, which suffers from the severe check-in data sparsity issue. In fact, coarse-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:MVE, author = "Dongjing Wang and Xin Zhang and Yuyu Yin and Dongjin Yu and Guandong Xu and Shuiguang Deng", title = "Multi-View Enhanced Graph Attention Network for Session-Based Music Recommendation", journal = j-TOIS, volume = "42", number = "1", pages = "16:1--16:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3592853", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3592853", abstract = "Traditional music recommender systems are mainly based on users' interactions, which limit their performance. Particularly, various kinds of content information, such as metadata and description can be used to improve music recommendation. However, it \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2024:MUS, author = "Weiwei Sun and Shuyu Guo and Shuo Zhang and Pengjie Ren and Zhumin Chen and Maarten de Rijke and Zhaochun Ren", title = "Metaphorical User Simulators for Evaluating Task-oriented Dialogue Systems", journal = j-TOIS, volume = "42", number = "1", pages = "17:1--17:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3596510", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3596510", abstract = "Task-oriented dialogue systems (TDSs) are assessed mainly in an offline setting or through human evaluation. The evaluation is often limited to single-turn or is very time-intensive. As an alternative, user simulators that mimic user behavior allow us to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2024:LHS, author = "Yingrong Qin and Chen Gao and Shuangqing Wei and Yue Wang and Depeng Jin and Jian Yuan and Lin Zhang and Dong Li and Jianye Hao and Yong Li", title = "Learning from Hierarchical Structure of Knowledge Graph for Recommendation", journal = j-TOIS, volume = "42", number = "1", pages = "18:1--18:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3595632", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3595632", abstract = "Knowledge graphs (KGs) can help enhance recommendations, especially for the data-sparsity scenarios with limited user-item interaction data. Due to the strong power of representation learning of graph neural networks (GNNs), recent works of KG-based \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Rashidi:2024:IJV, author = "Lida Rashidi and Justin Zobel and Alistair Moffat", title = "The Impact of Judgment Variability on the Consistency of Offline Effectiveness Measures", journal = j-TOIS, volume = "42", number = "1", pages = "19:1--19:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3596511", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3596511", abstract = "Measurement of the effectiveness of search engines is often based on use of relevance judgments. It is well known that judgments can be inconsistent between judges, leading to discrepancies that potentially affect not only scores but also system \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bruch:2024:AFF, author = "Sebastian Bruch and Siyu Gai and Amir Ingber", title = "An Analysis of Fusion Functions for Hybrid Retrieval", journal = j-TOIS, volume = "42", number = "1", pages = "20:1--20:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3596512", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3596512", abstract = "We study hybrid search in text retrieval where lexical and semantic search are fused together with the intuition that the two are complementary in how they model relevance. In particular, we examine fusion by a convex combination of lexical and semantic \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Roitero:2024:HMC, author = "Kevin Roitero and David {La Barbera} and Michael Soprano and Gianluca Demartini and Stefano Mizzaro and Tetsuya Sakai", title = "How Many Crowd Workers Do {I} Need? {On} Statistical Power when Crowdsourcing Relevance Judgments", journal = j-TOIS, volume = "42", number = "1", pages = "21:1--21:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3597201", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3597201", abstract = "To scale the size of Information Retrieval collections, crowdsourcing has become a common way to collect relevance judgments at scale. Crowdsourcing experiments usually employ 100-10,000 workers, but such a number is often decided in a heuristic way. The \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2024:DLR, author = "Heyan Huang and Changsen Yuan and Qian Liu and Yixin Cao", title = "Document-level Relation Extraction via Separate Relation Representation and Logical Reasoning", journal = j-TOIS, volume = "42", number = "1", pages = "22:1--22:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3597610", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3597610", abstract = "Document-level relation extraction (RE) extends the identification of entity/mentions' relation from the single sentence to the long document. It is more realistic and poses new challenges to relation representation and reasoning skills. In this article, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sakai:2024:OPW, author = "Tetsuya Sakai and Sijie Tao and Nuo Chen and Yujing Li and Maria Maistro and Zhumin Chu and Nicola Ferro", title = "On the Ordering of Pooled {Web} Pages, Gold Assessments, and Bronze Assessments", journal = j-TOIS, volume = "42", number = "1", pages = "23:1--23:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3600227", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3600227", abstract = "The present study leverages a recent opportunity we had to create a new English web search test collection for the NTCIR-16 We Want Web (WWW-4) task, which concluded in June 2022. More specifically, through the test collection construction effort, we \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yin:2024:UDS, author = "Qing Yin and Hui Fang and Zhu Sun and Yew-Soon Ong", title = "Understanding Diversity in Session-based Recommendation", journal = j-TOIS, volume = "42", number = "1", pages = "24:1--24:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3600226", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3600226", abstract = "Current session-based recommender systems (SBRSs) mainly focus on maximizing recommendation accuracy, while few studies have been devoted to improve diversity beyond accuracy. Meanwhile, it is unclear how the accuracy-oriented SBRSs perform in terms of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jing:2024:SDT, author = "Liqiang Jing and Xuemeng Song and Xuming Lin and Zhongzhou Zhao and Wei Zhou and Liqiang Nie", title = "Stylized Data-to-text Generation: a Case Study in the E-Commerce Domain", journal = j-TOIS, volume = "42", number = "1", pages = "25:1--25:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3603374", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3603374", abstract = "Existing data-to-text generation efforts mainly focus on generating a coherent text from non-linguistic input data, such as tables and attribute-value pairs, but overlook that different application scenarios may require texts of different styles. Inspired \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:INR, author = "Haoyang Li and Ziwei Zhang and Xin Wang and Wenwu Zhu", title = "Invariant Node Representation Learning under Distribution Shifts with Multiple Latent Environments", journal = j-TOIS, volume = "42", number = "1", pages = "26:1--26:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3604427", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3604427", abstract = "Node representation learning methods, such as graph neural networks, show promising results when testing and training graph data come from the same distribution. However, the existing approaches fail to generalize under distribution shifts when the nodes \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2024:ASO, author = "Chuan Qin and Hengshu Zhu and Dazhong Shen and Ying Sun and Kaichun Yao and Peng Wang and Hui Xiong", title = "Automatic Skill-Oriented Question Generation and Recommendation for Intelligent Job Interviews", journal = j-TOIS, volume = "42", number = "1", pages = "27:1--27:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3604552", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3604552", abstract = "Job interviews are the most widely accepted method for companies to select suitable candidates, and a critical challenge is finding the right questions to ask job candidates. Moreover, there is a lack of integrated tools for automatically generating \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ni:2024:MCD, author = "Yuxin Ni and Yunwen Xia and Hui Fang and Chong Long and Xinyu Kong and Daqian Li and Dong Yang and Jie Zhang", title = "{Meta-CRS}: a Dynamic Meta-Learning Approach for Effective Conversational Recommender System", journal = j-TOIS, volume = "42", number = "1", pages = "28:1--28:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3604804", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3604804", abstract = "Conversational recommender system (CRS) enhances the recommender system by acquiring the latest user preference through dialogues, where an agent needs to decide ``whether to ask or recommend'', ``which attributes to ask'', and ``which items to recommend'' in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2024:RMA, author = "Zhichao Xu and Hansi Zeng and Juntao Tan and Zuohui Fu and Yongfeng Zhang and Qingyao Ai", title = "A Reusable Model-agnostic Framework for Faithfully Explainable Recommendation and System Scrutability", journal = j-TOIS, volume = "42", number = "1", pages = "29:1--29:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3605357", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3605357", abstract = "State-of-the-art industrial-level recommender system applications mostly adopt complicated model structures such as deep neural networks. While this helps with the model performance, the lack of system explainability caused by these nearly blackbox models \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Meng:2024:CFK, author = "Chang Meng and Ziqi Zhao and Wei Guo and Yingxue Zhang and Haolun Wu and Chen Gao and Dong Li and Xiu Li and Ruiming Tang", title = "Coarse-to-Fine Knowledge-Enhanced Multi-Interest Learning Framework for Multi-Behavior Recommendation", journal = j-TOIS, volume = "42", number = "1", pages = "30:1--30:??", month = jan, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3606369", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Nov 3 14:26:23 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3606369", abstract = "Multi-types of behaviors (e.g., clicking, carting, purchasing, etc.) widely exist in most real-world recommendation scenarios, which are beneficial to learn users' multi-faceted preferences. As dependencies are explicitly exhibited by the multiple types \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2024:CKG, author = "Yang Yang and Chubing Zhang and Xin Song and Zheng Dong and Hengshu Zhu and Wenjie Li", title = "Contextualized Knowledge Graph Embedding for Explainable Talent Training Course Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "33:1--33:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3597022", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3597022", abstract = "Learning and development, or L\&D, plays an important role in talent management, which aims to improve the knowledge and capabilities of employees through a variety of performance-oriented training activities. Recently, with the rapid development of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yao:2024:DBL, author = "Yitong Yao and Jing Zhang and Peng Zhang and Yueheng Sun", title = "A Dual-branch Learning Model with Gradient-balanced Loss for Long-tailed Multi-label Text Classification", journal = j-TOIS, volume = "42", number = "2", pages = "34:1--34:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3597416", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3597416", abstract = "Multi-label text classification has a wide range of applications in the real world. However, the data distribution in the real world is often imbalanced, which leads to serious long-tailed problems. For multi-label classification, due to the vast scale of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lan:2024:TEC, author = "Tian Lan and Xian-Ling Mao and Wei Wei and Xiaoyan Gao and Heyan Huang", title = "Towards Efficient Coarse-grained Dialogue Response Selection", journal = j-TOIS, volume = "42", number = "2", pages = "35:1--35:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3597609", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3597609", abstract = "Coarse-grained response selection is a fundamental and essential subsystem for the widely used retrieval-based chatbots, aiming to recall a coarse-grained candidate set from a large-scale dataset. The dense retrieval technique has recently been proven \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:PPR, author = "Canjia Li and Andrew Yates and Sean MacAvaney and Ben He and Yingfei Sun", title = "{PARADE}: Passage Representation Aggregation for Document Reranking", journal = j-TOIS, volume = "42", number = "2", pages = "36:1--36:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3600088", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3600088", abstract = "Pre-trained transformer models, such as BERT and T5, have shown to be highly effective at ad hoc passage and document ranking. Due to the inherent sequence length limits of these models, they need to process document passages one at a time rather than \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xie:2024:HTS, author = "Jiayi Xie and Zhenzhong Chen", title = "Hierarchical Transformer with Spatio-temporal Context Aggregation for Next Point-of-interest Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "37:1--37:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3597930", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3597930", abstract = "Next point-of-interest (POI) recommendation is a critical task in location-based social networks, yet remains challenging due to a high degree of variation and personalization exhibited in user movements. In this work, we explore the latent hierarchical \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2024:SIG, author = "Chen Xu and Jun Xu and Zhenhua Dong and Ji-Rong Wen", title = "Syntactic-Informed Graph Networks for Sentence Matching", journal = j-TOIS, volume = "42", number = "2", pages = "38:1--38:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3609795", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3609795", abstract = "Matching two natural language sentences is a fundamental problem in both natural language processing and information retrieval. Preliminary studies have shown that the syntactic structures help improve the matching accuracy, and different syntactic \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:TBP, author = "Xinyu Zhang and Kelechi Ogueji and Xueguang Ma and Jimmy Lin", title = "Toward Best Practices for Training Multilingual Dense Retrieval Models", journal = j-TOIS, volume = "42", number = "2", pages = "39:1--39:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3613447", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3613447", abstract = "Dense retrieval models using a transformer-based bi-encoder architecture have emerged as an active area of research. In this article, we focus on the task of monolingual retrieval in a variety of typologically diverse languages using such an architecture. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2024:ISI, author = "Yixiao Ma and Yueyue Wu and Qingyao Ai and Yiqun Liu and Yunqiu Shao and Min Zhang and Shaoping Ma", title = "Incorporating Structural Information into Legal Case Retrieval", journal = j-TOIS, volume = "42", number = "2", pages = "40:1--40:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3609796", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3609796", abstract = "Legal case retrieval has received increasing attention in recent years. However, compared to ad hoc retrieval tasks, legal case retrieval has its unique challenges. First, case documents are rather lengthy and contain complex legal structures. Therefore, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2024:BGS, author = "Yatong Sun and Xiaochun Yang and Zhu Sun and Bin Wang", title = "{BERD+}: a Generic Sequential Recommendation Framework by Eliminating Unreliable Data with Item- and Attribute-level Signals", journal = j-TOIS, volume = "42", number = "2", pages = "41:1--41:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3611008", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3611008", abstract = "Most sequential recommendation systems (SRSs) predict the next item as the target for users given its preceding items as input, assuming the target is definitely related to its input. However, users may unintentionally click items that are inconsistent \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bruch:2024:AAM, author = "Sebastian Bruch and Franco Maria Nardini and Amir Ingber and Edo Liberty", title = "An Approximate Algorithm for Maximum Inner Product Search over Streaming Sparse Vectors", journal = j-TOIS, volume = "42", number = "2", pages = "42:1--42:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3609797", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3609797", abstract = "Maximum Inner Product Search or top- k retrieval on sparse vectors is well understood in information retrieval, with a number of mature algorithms that solve it exactly. However, all existing algorithms are tailored to text and frequency-based similarity \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:SSL, author = "Shengyu Zhang and Tan Jiang and Kun Kuang and Fuli Feng and Jin Yu and Jianxin Ma and Zhou Zhao and Jianke Zhu and Hongxia Yang and Tat-Seng Chua and Fei Wu", title = "{SLED}: Structure Learning based Denoising for Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "43:1--43:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3611385", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3611385", abstract = "In recommender systems, click behaviors play a fundamental role in mining users' interests and training models (clicked items as positive samples). Such signals are implicit feedback and are arguably less representative of users' inherent interests. Most \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Quan:2024:AVL, author = "Yuhan Quan and Jingtao Ding and Chen Gao and Nian Li and Lingling Yi and Depeng Jin and Yong Li", title = "Alleviating Video-length Effect for Micro-video Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "44:1--44:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3617826", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3617826", abstract = "Micro-video platforms such as TikTok are extremely popular nowadays. One important feature is that users no longer select interested videos from a set; instead, they either watch the recommended video or skip to the next one. As a result, the time length \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2024:HEN, author = "Sannyuya Liu and Shengyingjie Liu and Zongkai Yang and Jianwen Sun and Xiaoxuan Shen and Qing Li and Rui Zou and Shangheng Du", title = "Heterogeneous Evolution Network Embedding with Temporal Extension for Intelligent Tutoring Systems", journal = j-TOIS, volume = "42", number = "2", pages = "45:1--45:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3617828", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3617828", abstract = "Graph embedding (GE) aims to acquire low-dimensional node representations while maintaining the graph's structural and semantic attributes. Intelligent tutoring systems (ITS) signify a noteworthy achievement in the fusion of AI and education. Utilizing GE \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Niu:2024:PAI, author = "Yanrui Niu and Chao Liang and Ankang Lu and Baojin Huang and Zhongyuan Wang and Jiahao Guo", title = "Person-action Instance Search in Story Videos: an Experimental Study", journal = j-TOIS, volume = "42", number = "2", pages = "46:1--46:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3617892", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3617892", abstract = "Person-Action instance search (P-A INS) aims to retrieve the instances of a specific person doing a specific action, which appears in the 2019-2021 INS tasks of the world-famous TREC Video Retrieval Evaluation (TRECVID). Most of the top-ranking solutions \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "46", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2024:DMF, author = "Han Liu and Yinwei Wei and Fan Liu and Wenjie Wang and Liqiang Nie and Tat-Seng Chua", title = "Dynamic Multimodal Fusion via Meta-Learning Towards Micro-Video Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "47:1--47:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3617827", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3617827", abstract = "Multimodal information (e.g., visual, acoustic, and textual) has been widely used to enhance representation learning for micro-video recommendation. For integrating multimodal information into a joint representation of micro-video, multimodal fusion plays \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "47", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2024:DDA, author = "Lei Guo and Hao Liu and Lei Zhu and Weili Guan and Zhiyong Cheng", title = "{DA-DAN}: a Dual Adversarial Domain Adaption Network for Unsupervised Non-overlapping Cross-domain Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "48:1--48:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3617825", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3617825", abstract = "Unsupervised Non-overlapping Cross-domain Recommendation (UNCR) is the task that recommends source domain items to the target domain users, which is more challenging as the users are non-overlapped, and its learning process is unsupervised. Unsupervised \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "48", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2024:PDK, author = "Longxuan Ma and Jiapeng Li and Mingda Li and Wei-Nan Zhang and Ting Liu", title = "Policy-driven Knowledge Selection and Response Generation for Document-grounded Dialogue", journal = j-TOIS, volume = "42", number = "2", pages = "49:1--49:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3617829", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3617829", abstract = "Document-grounded dialogue (DGD) uses documents as external knowledge for dialogue generation. Correctly understanding the dialogue context is crucial for selecting knowledge from the document and generating proper responses. In this article, we propose \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "49", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hu:2024:SCL, author = "Yupeng Hu and Kun Wang and Meng Liu and Haoyu Tang and Liqiang Nie", title = "Semantic Collaborative Learning for Cross-Modal Moment Localization", journal = j-TOIS, volume = "42", number = "2", pages = "50:1--50:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3620669", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3620669", abstract = "Localizing a desired moment within an untrimmed video via a given natural language query, i.e., cross-modal moment localization, has attracted widespread research attention recently. However, it is a challenging task because it requires not only \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "50", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:MAG, author = "Ke Wang and Yanmin Zhu and Tianzi Zang and Chunyang Wang and Kuan Liu and Peibo Ma", title = "Multi-aspect Graph Contrastive Learning for Review-enhanced Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "51:1--51:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3618106", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3618106", abstract = "Review-based recommender systems explore semantic aspects of users' preferences by incorporating user-generated reviews into rating-based models. Recent works have demonstrated the potential of review information to improve the recommendation capacity. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "51", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shi:2024:RPB, author = "Xiaoyu Shi and Quanliang Liu and Hong Xie and Di Wu and Bo Peng and MingSheng Shang and Defu Lian", title = "Relieving Popularity Bias in Interactive Recommendation: a Diversity-Novelty-Aware Reinforcement Learning Approach", journal = j-TOIS, volume = "42", number = "2", pages = "52:1--52:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3618107", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3618107", abstract = "While personalization increases the utility of item recommendation, it also suffers from the issue of popularity bias. However, previous methods emphasize adopting supervised learning models to relieve popularity bias in the static recommendation, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "52", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2024:MDS, author = "Xiaolin Chen and Xuemeng Song and Liqiang Jing and Shuo Li and Linmei Hu and Liqiang Nie", title = "Multimodal Dialog Systems with Dual Knowledge-enhanced Generative Pretrained Language Model", journal = j-TOIS, volume = "42", number = "2", pages = "53:1--53:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3606368", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3606368", abstract = "Text response generation for multimodal task-oriented dialog systems, which aims to generate the proper text response given the multimodal context, is an essential yet challenging task. Although existing efforts have achieved compelling success, they \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "53", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2024:DMP, author = "Yifang Qin and Hongjun Wu and Wei Ju and Xiao Luo and Ming Zhang", title = "A Diffusion Model for {POI} Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "54:1--54:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3624475", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3624475", abstract = "Next Point-of-Interest (POI) recommendation is a critical task in location-based services that aim to provide personalized suggestions for the user's next destination. Previous works on POI recommendation have laid focus on modeling the user's spatial \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "54", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Siro:2024:UPU, author = "Clemencia Siro and Mohammad Aliannejadi and Maarten {De Rijke}", title = "Understanding and Predicting User Satisfaction with Conversational Recommender Systems", journal = j-TOIS, volume = "42", number = "2", pages = "55:1--55:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3624989", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3624989", abstract = "User satisfaction depicts the effectiveness of a system from the user's perspective. Understanding and predicting user satisfaction is vital for the design of user-oriented evaluation methods for conversational recommender systems (CRSs). Current \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "55", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:SSB, author = "Chao Wang and Hengshu Zhu and Chen Zhu and Chuan Qin and Enhong Chen and Hui Xiong", title = "{SetRank}: a Setwise {Bayesian} Approach for Collaborative Ranking in Recommender System", journal = j-TOIS, volume = "42", number = "2", pages = "56:1--56:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3626194", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3626194", abstract = "The recent development of recommender systems has a focus on collaborative ranking, which provides users with a sorted list rather than rating prediction. The sorted item lists can more directly reflect the preferences for users and usually perform better \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "56", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2024:NPM, author = "Shicheng Xu and Liang Pang and Huawei Shen and Xueqi Cheng", title = "{NIR-Prompt}: a Multi-task Generalized Neural Information Retrieval Training Framework", journal = j-TOIS, volume = "42", number = "2", pages = "57:1--57:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3626092", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3626092", abstract = "Information retrieval aims to find information that meets users' needs from the corpus. Different needs correspond to different IR tasks such as document retrieval, open-domain question answering, retrieval-based dialogue, and so on, while they share the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "57", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wan:2024:STC, author = "Zhongwei Wan and Xin Liu and Benyou Wang and Jiezhong Qiu and Boyu Li and Ting Guo and Guangyong Chen and Yang Wang", title = "Spatio-temporal Contrastive Learning-enhanced {GNNs} for Session-based Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "58:1--58:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3626091", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3626091", abstract = "Session-based recommendation (SBR) systems aim to utilize the user's short-term behavior sequence to predict the next item without the detailed user profile. Most recent works try to model the user preference by treating the sessions as between-item \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "58", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jing:2024:CSS, author = "Mengyuan Jing and Yanmin Zhu and Tianzi Zang and Ke Wang", title = "Contrastive Self-supervised Learning in Recommender Systems: a Survey", journal = j-TOIS, volume = "42", number = "2", pages = "59:1--59:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3627158", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3627158", abstract = "Deep learning-based recommender systems have achieved remarkable success in recent years. However, these methods usually heavily rely on labeled data (i.e., user-item interactions), suffering from problems such as data sparsity and cold-start. Self-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "59", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yi:2024:CGP, author = "Zixuan Yi and Iadh Ounis and Craig MacDonald", title = "Contrastive Graph Prompt-tuning for Cross-domain Recommendation", journal = j-TOIS, volume = "42", number = "2", pages = "60:1--60:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3618298", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3618298", abstract = "Recommender systems commonly suffer from the long-standing data sparsity problem where insufficient user-item interaction data limits the systems' ability to make accurate recommendations. This problem can be alleviated using cross-domain recommendation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "60", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bassani:2024:PQE, author = "Elias Bassani and Nicola Tonellotto and Gabriella Pasi", title = "Personalized Query Expansion with Contextual Word Embeddings", journal = j-TOIS, volume = "42", number = "2", pages = "61:1--61:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3624988", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3624988", abstract = "Personalized Query Expansion, the task of expanding queries with additional terms extracted from the user-related vocabulary, is a well-known solution to improve the retrieval performance of a system w.r.t. short queries. Recent approaches rely on word \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "61", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shao:2024:ITL, author = "Yunqiu Shao and Haitao Li and Yueyue Wu and Yiqun Liu and Qingyao Ai and Jiaxin Mao and Yixiao Ma and Shaoping Ma", title = "An Intent Taxonomy of Legal Case Retrieval", journal = j-TOIS, volume = "42", number = "2", pages = "62:1--62:??", month = mar, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3626093", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu Dec 28 06:52:28 MST 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3626093", abstract = "Legal case retrieval is a special Information Retrieval (IR) task focusing on legal case documents. Depending on the downstream tasks of the retrieved case documents, users' information needs in legal case retrieval could be significantly different from \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "62", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yin:2024:HHH, author = "Zhizhuo Yin and Kai Han and Pengzi Wang and Xi Zhu", title = "{H3GNN}: Hybrid Hierarchical {HyperGraph} Neural Network for Personalized Session-based Recommendation", journal = j-TOIS, volume = "42", number = "3", pages = "63:1--63:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3630002", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3630002", abstract = "Personalized Session-based recommendation (PSBR) is a general and challenging task in the real world, aiming to recommend a session's next clicked item based on the session's item transition information and the corresponding user's historical sessions. A \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "63", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yuan:2024:MVA, author = "Wei Yuan and Shilong Yuan and Chaoqun Yang and Nguyen Quoc Viet hung and Hongzhi Yin", title = "Manipulating Visually Aware Federated Recommender Systems and Its Countermeasures", journal = j-TOIS, volume = "42", number = "3", pages = "64:1--64:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3630005", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3630005", abstract = "Federated recommender systems (FedRecs) have been widely explored recently due to their capability to safeguard user data privacy. These systems enable a central server to collaboratively learn recommendation models by sharing public parameters with \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "64", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Choi:2024:BUP, author = "Bogeum Choi and Sarah Casteel and Jaime Arguello and Robert Capra", title = "Better Understanding Procedural Search Tasks: Perceptions, Behaviors, and Challenges", journal = j-TOIS, volume = "42", number = "3", pages = "65:1--65:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3630004", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3630004", abstract = "People often search for information to acquire procedural knowledge-``how to'' knowledge about step-by-step procedures, methods, algorithms, techniques, heuristics, and skills. A procedural search task might involve implementing a solution to a problem, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "65", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:DDM, author = "Zihao Li and Aixin Sun and Chenliang Li", title = "{DiffuRec}: a Diffusion Model for Sequential Recommendation", journal = j-TOIS, volume = "42", number = "3", pages = "66:1--66:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631116", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631116", abstract = "Mainstream solutions to sequential recommendation represent items with fixed vectors. These vectors have limited capability in capturing items' latent aspects and users' diverse preferences. As a new generative paradigm, diffusion models have achieved \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "66", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ni:2024:CPS, author = "Xuelian Ni and Fei Xiong and Shirui Pan and Jia Wu and Liang Wang and Hongshu Chen", title = "Community Preserving Social Recommendation with Cyclic Transfer Learning", journal = j-TOIS, volume = "42", number = "3", pages = "67:1--67:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631115", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631115", abstract = "Transfer learning-based recommendation mitigates the sparsity of user-item interactions by introducing auxiliary domains. Social influence extracted from direct connections between users typically serves as an auxiliary domain to improve prediction \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "67", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:BPL, author = "Xiaokun Zhang and Bo Xu and Fenglong Ma and Chenliang Li and Yuan Lin and Hongfei Lin", title = "{Bi}-preference Learning Heterogeneous Hypergraph Networks for Session-based Recommendation", journal = j-TOIS, volume = "42", number = "3", pages = "68:1--68:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631940", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631940", abstract = "Session-based recommendation intends to predict next purchased items based on anonymous behavior sequences. Numerous economic studies have revealed that item price is a key factor influencing user purchase decisions. Unfortunately, existing methods for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "68", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Giner:2024:IRE, author = "Fernando Giner", title = "Information Retrieval Evaluation Measures Defined on Some Axiomatic Models of Preferences", journal = j-TOIS, volume = "42", number = "3", pages = "69:1--69:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632171", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632171", abstract = "Information retrieval (IR) evaluation measures are essential for capturing the relevance of documents to topics and determining the task performance efficiency of retrieval systems. The study of IR evaluation measures through their formal properties \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "69", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:TDL, author = "Yuting Zhang and Ying Sun and Fuzhen Zhuang and Yongchun Zhu and Zhulin An and Yongjun Xu", title = "Triple Dual Learning for Opinion-based Explainable Recommendation", journal = j-TOIS, volume = "42", number = "3", pages = "70:1--70:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631521", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631521", abstract = "Recently, with the aim of enhancing the trustworthiness of recommender systems, explainable recommendation has attracted much attention from the research community. Intuitively, users' opinions toward different aspects of an item determine their ratings \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "70", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:RAS, author = "Yitao Zhang and Changxuan Wan and Keli Xiao and Qizhi Wan and Dexi Liu and Xiping Liu", title = "{rHDP}: an Aspect Sharing-Enhanced Hierarchical Topic Model for Multi-Domain Corpus", journal = j-TOIS, volume = "42", number = "3", pages = "71:1--71:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631352", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631352", abstract = "Learning topic hierarchies from a multi-domain corpus is crucial in topic modeling as it reveals valuable structural information embedded within documents. Despite the extensive literature on hierarchical topic models, effectively discovering inter-topic \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "71", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hu:2024:DPD, author = "Kaixi Hu and Lin Li and Qing Xie and Jianquan Liu and Xiaohui Tao and Guandong Xu", title = "Decoupled Progressive Distillation for Sequential Prediction with Interaction Dynamics", journal = j-TOIS, volume = "42", number = "3", pages = "72:1--72:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632403", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632403", abstract = "Sequential prediction has great value for resource allocation due to its capability in analyzing intents for next prediction. A fundamental challenge arises from real-world interaction dynamics where similar sequences involving multiple intents may \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "72", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Stevenson:2024:SMT, author = "Mark Stevenson and Reem Bin-Hezam", title = "Stopping Methods for Technology-assisted Reviews Based on Point Processes", journal = j-TOIS, volume = "42", number = "3", pages = "73:1--73:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631990", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631990", abstract = "Technology-assisted Review (TAR), which aims to reduce the effort required to screen collections of documents for relevance, is used to develop systematic reviews of medical evidence and identify documents that must be disclosed in response to legal \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "73", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mei:2024:IFS, author = "Lang Mei and Jiaxin Mao and Juan Hu and Naiqiang Tan and Hua Chai and Ji-Rong Wen", title = "Improving First-stage Retrieval of Point-of-interest Search by Pre-training Models", journal = j-TOIS, volume = "42", number = "3", pages = "74:1--74:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631937", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631937", abstract = "Point-of-interest (POI) search is important for location-based services, such as navigation and online ride-hailing service. The goal of POI search is to find the most relevant destinations from a large-scale POI database given a text query. To improve \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "74", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2024:LTI, author = "Jiaxin Wu and Chong-Wah Ngo and Wing-Kwong Chan and Zhijian Hou", title = "{(Un)likelihood} Training for Interpretable Embedding", journal = j-TOIS, volume = "42", number = "3", pages = "75:1--75:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632752", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632752", abstract = "Cross-modal representation learning has become a new normal for bridging the semantic gap between text and visual data. Learning modality agnostic representations in a continuous latent space, however, is often treated as a black-box data-driven training \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "75", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zang:2024:CMV, author = "Tianzi Zang and Yanmin Zhu and Ruohan Zhang and Chunyang Wang and Ke Wang and Jiadi Yu", title = "Contrastive Multi-view Interest Learning for Cross-domain Sequential Recommendation", journal = j-TOIS, volume = "42", number = "3", pages = "76:1--76:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632402", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632402", abstract = "Cross-domain recommendation (CDR), which leverages information collected from other domains, has been empirically demonstrated to effectively alleviate data sparsity and cold-start problems encountered in traditional recommendation systems. However, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "76", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Krasakis:2024:CEC, author = "Antonios Minas Krasakis and Andrew Yates and Evangelos Kanoulas", title = "Contextualizing and Expanding Conversational Queries without Supervision", journal = j-TOIS, volume = "42", number = "3", pages = "77:1--77:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632622", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632622", abstract = "Most conversational passage retrieval systems try to resolve conversational dependencies by using an intermediate query resolution step. To do so, they synthesize conversational data or assume the availability of large-scale question rewriting datasets. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "77", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cui:2024:DDG, author = "Chaoran Cui and Yumo Yao and Chunyun Zhang and Hebo Ma and Yuling Ma and Zhaochun Ren and Chen Zhang and James Ko", title = "{DGEKT}: a Dual Graph Ensemble Learning Method for Knowledge Tracing", journal = j-TOIS, volume = "42", number = "3", pages = "78:1--78:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3638350", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3638350", abstract = "Knowledge tracing aims to trace students' evolving knowledge states by predicting their future performance on concept-related exercises. Recently, some graph-based models have been developed to incorporate the relationships between exercises to improve \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "78", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Michalkova:2024:UFK, author = "Dominika Michalkova and Mario Parra Rodriguez and Yashar Moshfeghi", title = "Understanding Feeling-of-Knowing in Information Search: an {EEG} Study", journal = j-TOIS, volume = "42", number = "3", pages = "79:1--79:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3611384", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3611384", abstract = "The realisation and the variability of information needs (IN) with respect to a searcher's gap in knowledge is driven by the perceived Anomalous State of Knowledge (ASK). The concept of Feeling-of-Knowing (FOK), as the introspective feeling of knowledge \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "79", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:RCF, author = "An Zhang and Wenchang Ma and Jingnan Zheng and Xiang Wang and Tat-Seng Chua", title = "Robust Collaborative Filtering to Popularity Distribution Shift", journal = j-TOIS, volume = "42", number = "3", pages = "80:1--80:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3627159", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3627159", abstract = "In leading collaborative filtering (CF) models, representations of users and items are prone to learn popularity bias in the training data as shortcuts. The popularity shortcut tricks are good for in-distribution (ID) performance but poorly generalized to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "80", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:PDR, author = "Shuting Wang and Zhicheng Dou and Jiongnan Liu and Qiannan Zhu and Ji-Rong Wen", title = "Personalized and Diversified: Ranking Search Results in an Integrated Way", journal = j-TOIS, volume = "42", number = "3", pages = "81:1--81:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631989", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631989", abstract = "Ambiguity in queries is a common problem in information retrieval. There are currently two solutions: search result personalization and diversification. The former aims to tailor results for different users based on their preferences, but the limitations \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "81", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fu:2024:PPI, author = "Wenjie Fu and Huandong Wang and Chen Gao and Guanghua Liu and Yong Li and Tao Jiang", title = "Privacy-Preserving Individual-Level {COVID-19} Infection Prediction via Federated Graph Learning", journal = j-TOIS, volume = "42", number = "3", pages = "82:1--82:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3633202", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3633202", abstract = "Accurately predicting individual-level infection state is of great value since its essential role in reducing the damage of the epidemic. However, there exists an inescapable risk of privacy leakage in the fine-grained user mobility trajectories required \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "82", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Su:2024:CDR, author = "Hongzu Su and Jingjing Li and Zhekai Du and Lei Zhu and Ke Lu and Heng Tao Shen", title = "Cross-domain Recommendation via Dual Adversarial Adaptation", journal = j-TOIS, volume = "42", number = "3", pages = "83:1--83:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632524", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632524", abstract = "Data scarcity is a perpetual challenge of recommendation systems, and researchers have proposed a variety of cross-domain recommendation methods to alleviate the problem of data scarcity in target domains. However, in many real-world cross-domain \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "83", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lan:2024:EDR, author = "Tian Lan and Deng Cai and Yan Wang and Yixuan Su and Heyan Huang and Xian-Ling Mao", title = "Exploring Dense Retrieval for Dialogue Response Selection", journal = j-TOIS, volume = "42", number = "3", pages = "84:1--84:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632750", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632750", abstract = "Recent progress in deep learning has continuously improved the accuracy of dialogue response selection. However, in real-world scenarios, the high computation cost forces existing dialogue response selection models to rank only a small number of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "84", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Peng:2024:LMR, author = "Shaowen Peng and Kazunari Sugiyama and Tsunenori Mine", title = "Less is More: Removing Redundancy of Graph Convolutional Networks for Recommendation", journal = j-TOIS, volume = "42", number = "3", pages = "85:1--85:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3632751", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3632751", abstract = "While Graph Convolutional Networks (GCNs) have shown great potential in recommender systems and collaborative filtering (CF), they suffer from expensive computational complexity and poor scalability. On top of that, recent works mostly combine GCNs with \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "85", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gao:2024:SEA, author = "Jingtong Gao and Xiangyu Zhao and Muyang Li and Minghao Zhao and Runze Wu and Ruocheng Guo and Yiding Liu and Dawei Yin", title = "{SMLP4Rec}: an Efficient {All-MLP} Architecture for Sequential Recommendations", journal = j-TOIS, volume = "42", number = "3", pages = "86:1--86:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637871", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637871", abstract = "Self-attention models have achieved the state-of-the-art performance in sequential recommender systems by capturing the sequential dependencies among user-item interactions. However, they rely on adding positional embeddings to the item sequence to retain \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "86", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2024:ISE, author = "Jiechen Xu and Lei Han and Shazia Sadiq and Gianluca Demartini", title = "On the Impact of Showing Evidence from Peers in Crowdsourced Truthfulness Assessments", journal = j-TOIS, volume = "42", number = "3", pages = "87:1--87:??", month = may, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637872", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri May 10 08:15:31 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637872", abstract = "Misinformation has been rapidly spreading online. The common approach to dealing with it is deploying expert fact-checkers who follow forensic processes to identify the veracity of statements. Unfortunately, such an approach does not scale well. To deal \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "87", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gao:2024:CIR, author = "Chen Gao and Yu Zheng and Wenjie Wang and Fuli Feng and Xiangnan He and Yong Li", title = "Causal Inference in Recommender Systems: a Survey and Future Directions", journal = j-TOIS, volume = "42", number = "4", pages = "88:1--88:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3639048", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3639048", abstract = "Recommender systems have become crucial in information filtering nowadays. Existing recommender systems extract user preferences based on the correlation in data, such as behavioral correlation in collaborative filtering, feature-feature, or feature-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "88", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2024:DTR, author = "Wayne Xin Zhao and Jing Liu and Ruiyang Ren and Ji-Rong Wen", title = "Dense Text Retrieval Based on Pretrained Language Models: a Survey", journal = j-TOIS, volume = "42", number = "4", pages = "89:1--89:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637870", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637870", abstract = "Text retrieval is a long-standing research topic on information seeking, where a system is required to return relevant information resources to user's queries in natural language. From heuristic-based retrieval methods to learning-based ranking functions, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "89", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2024:UMR, author = "Zhengbang Zhu and Rongjun Qin and Junjie Huang and Xinyi Dai and Yang Yu and Yong Yu and Weinan Zhang", title = "Understanding or Manipulation: Rethinking Online Performance Gains of Modern Recommender Systems", journal = j-TOIS, volume = "42", number = "4", pages = "90:1--90:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637869", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637869", abstract = "Recommender systems are expected to be assistants that help human users find relevant information automatically without explicit queries. As recommender systems evolve, increasingly sophisticated learning techniques are applied and have achieved better \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "90", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2024:TSL, author = "Haokai Ma and Ruobing Xie and Lei Meng and Xin Chen and Xu Zhang and Leyu Lin and Jie Zhou", title = "Triple Sequence Learning for Cross-domain Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "91:1--91:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3638351", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3638351", abstract = "Cross-domain recommendation (CDR) aims at leveraging the correlation of users' behaviors in both the source and target domains to improve the user preference modeling in the target domain. Conventional CDR methods typically explore the dual-relations \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "91", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Razgallah:2024:UNG, author = "H{\'e}di Razgallah and Michalis Vlachos and Ahmad Ajalloeian and Ninghao Liu and Johannes Schneider and Alexis Steinmann", title = "Using Neural and Graph Neural Recommender Systems to Overcome Choice Overload: Evidence From a Music Education Platform", journal = j-TOIS, volume = "42", number = "4", pages = "92:1--92:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637873", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637873", abstract = "The application of recommendation technologies has been crucial in the promotion of physical and digital content across numerous global platforms such as Amazon, Apple, and Netflix. Our study aims to investigate the advantages of employing recommendation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "92", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ye:2024:RFB, author = "Ziyi Ye and Xiaohui Xie and Qingyao Ai and Yiqun Liu and Zhihong Wang and Weihang Su and Min Zhang", title = "Relevance Feedback with Brain Signals", journal = j-TOIS, volume = "42", number = "4", pages = "93:1--93:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637874", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637874", abstract = "The Relevance Feedback (RF) process relies on accurate and real-time relevance estimation of feedback documents to improve retrieval performance. Since collecting explicit relevance annotations imposes an extra burden on the user, extensive studies have \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "93", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2024:FFA, author = "Wei Chen and Yiqing Wu and Zhao Zhang and Fuzhen Zhuang and Zhongshi He and Ruobing Xie and Feng Xia", title = "{FairGap}: Fairness-Aware Recommendation via Generating Counterfactual Graph", journal = j-TOIS, volume = "42", number = "4", pages = "94:1--94:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3638352", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3638352", abstract = "The emergence of Graph Neural Networks (GNNs) has greatly advanced the development of recommendation systems. Recently, many researchers have leveraged GNN-based models to learn fair representations for users and items. However, current GNN-based models \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "94", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Vuong:2024:PRI, author = "Tung Vuong and Tuukka Ruotsalo", title = "Predicting Representations of Information Needs from Digital Activity Context", journal = j-TOIS, volume = "42", number = "4", pages = "95:1--95:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3639819", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3639819", abstract = "Information retrieval systems often consider search-session and immediately preceding web-browsing history as the context for predicting users' present information needs. However, such context is only available when a user's information needs originate \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "95", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bai:2024:IOD, author = "Yutong Bai and Yujia Zhou and Zhicheng Dou and Ji-Rong Wen", title = "Intent-Oriented Dynamic Interest Modeling for Personalized {Web} Search", journal = j-TOIS, volume = "42", number = "4", pages = "96:1--96:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3639817", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3639817", abstract = "Given a user, a personalized search model relies on her historical behaviors, such as issued queries and their clicked documents, to generate an interest profile and personalize search results accordingly. In interest profiling, most existing personalized \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "96", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2024:MPP, author = "Hao Liu and Lei Guo and Lei Zhu and Yongqiang Jiang and Min Gao and Hongzhi Yin", title = "{MCRPL}: a Pretrain, Prompt, and Fine-tune Paradigm for Non-overlapping Many-to-one Cross-domain Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "97:1--97:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3641860", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3641860", abstract = "Cross-domain Recommendation is the task that tends to improve the recommendations in the sparse target domain by leveraging the information from other rich domains. Existing methods of cross-domain recommendation mainly focus on overlapping scenarios by \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "97", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2024:ESS, author = "Jiancan Wu and Xiang Wang and Xingyu Gao and Jiawei Chen and Hongcheng Fu and Tianyu Qiu", title = "On the Effectiveness of Sampled Softmax Loss for Item Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "98:1--98:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3637061", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3637061", abstract = "The learning objective plays a fundamental role to build a recommender system. Most methods routinely adopt either pointwise (e.g., binary cross-entropy) or pairwise (e.g., BPR) loss to train the model parameters, while rarely pay attention to softmax \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "98", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lalor:2024:SFM, author = "John P. Lalor and Ahmed Abbasi and Kezia Oketch and Yi Yang and Nicole Forsgren", title = "Should Fairness be a Metric or a Model? {A} Model-based Framework for Assessing Bias in Machine Learning Pipelines", journal = j-TOIS, volume = "42", number = "4", pages = "99:1--99:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3641276", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3641276", abstract = "Fairness measurement is crucial for assessing algorithmic bias in various types of machine learning (ML) models, including ones used for search relevance, recommendation, personalization, talent analytics, and natural language processing. However, the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "99", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2024:MMV, author = "Yunshan Ma and Yingzhi He and Xiang Wang and Yinwei Wei and Xiaoyu Du and Yuyangzi Fu and Tat-Seng Chua", title = "{MultiCBR}: Multi-view Contrastive Learning for Bundle Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "100:1--100:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3640810", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3640810", abstract = "Bundle recommendation seeks to recommend a bundle of related items to users to improve both user experience and the profits of platform. Existing bundle recommendation models have progressed from capturing only user-bundle interactions to the modeling of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "100", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cheng:2024:CPH, author = "Jiezhu Cheng and Kaizhu Huang and Zibin Zheng", title = "Can Perturbations Help Reduce Investment Risks? {Risk}-aware Stock Recommendation via Split Variational Adversarial Training", journal = j-TOIS, volume = "42", number = "4", pages = "101:1--101:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3643131", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3643131", abstract = "In the stock market, a successful investment requires a good balance between profits and risks. Based on the learning to rank paradigm, stock recommendation has been widely studied in quantitative finance to recommend stocks with higher return ratios for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "101", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Che:2024:TIE, author = "Shangkun Che and Hongyan Liu and Shen Liu", title = "Tagging Items with Emerging Tags: a Neural Topic Model Based Few-Shot Learning Approach", journal = j-TOIS, volume = "42", number = "4", pages = "102:1--102:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3641859", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3641859", abstract = "The tagging system has become a primary tool to organize information resources on the Internet, which benefits both users and the platforms. To build a successful tagging system, automatic tagging methods are desired. With the development of society, new \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "102", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:TCM, author = "Shengyu Zhang and Qiaowei Miao and Ping Nie and Mengze Li and Zhengyu Chen and Fuli Feng and Kun Kuang and Fei Wu", title = "Transferring Causal Mechanism over Meta-representations for Target-Unknown Cross-domain Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "103:1--103:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3643807", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3643807", abstract = "Tackling the pervasive issue of data sparsity in recommender systems, we present an insightful investigation into the burgeoning area of non-overlapping cross-domain recommendation, a technique that facilitates the transfer of interaction knowledge across \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "103", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wan:2024:TER, author = "Qizhi Wan and Changxuan Wan and Keli Xiao and Hui Xiong and Dexi Liu and Xiping Liu and Rong Hu", title = "Token-Event-Role Structure-Based Multi-Channel Document-Level Event Extraction", journal = j-TOIS, volume = "42", number = "4", pages = "104:1--104:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3643885", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3643885", abstract = "Document-level event extraction is a long-standing challenging information retrieval problem involving a sequence of sub-tasks: entity extraction, event type judgment, and event type-specific multi-event extraction. However, addressing the problem as \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "104", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:MML, author = "Shuzhe Li and Wei Chen and Bin Wang and Chao Huang and Yanwei Yu and Junyu Dong", title = "{MCN4Rec}: Multi-level Collaborative Neural Network for Next Location Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "105:1--105:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3643669", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3643669", abstract = "Next location recommendation plays an important role in various location-based services, yielding great value for both users and service providers. Existing methods usually model temporal dependencies with explicit time intervals or learn representation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "105", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:CEF, author = "Xiangmeng Wang and Qian Li and Dianer Yu and Qing Li and Guandong Xu", title = "Counterfactual Explanation for Fairness in Recommendation", journal = j-TOIS, volume = "42", number = "4", pages = "106:1--106:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3643670", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3643670", abstract = "Fairness-aware recommendation alleviates discrimination issues to build trustworthy recommendation systems. Explaining the causes of unfair recommendations is critical, as it promotes fairness diagnostics, and thus secures users' trust in recommendation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "106", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fang:2024:FSL, author = "Yang Fang and Xiang Zhao and Weidong Xiao and Maarten de Rijke", title = "Few-shot Learning for Heterogeneous Information Networks", journal = j-TOIS, volume = "42", number = "4", pages = "107:1--107:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3649311", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3649311", abstract = "Heterogeneous information networks (HINs) are a key resource in many domain-specific retrieval and recommendation scenarios and in conversational environments. Current approaches to mining graph data often rely on abundant supervised information. However, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "107", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:FBS, author = "Jun Li and Yi Bin and Yunshan Ma and Yang Yang and Zi Huang and Tat-Seng Chua", title = "Filter-based Stance Network for Rumor Verification", journal = j-TOIS, volume = "42", number = "4", pages = "108:1--108:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3649462", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3649462", abstract = "Rumor verification on social media aims to identify the truth value of a rumor, which is important to decrease the detrimental public effects. A rumor might arouse heated discussions and replies, conveying different stances of users that could be helpful \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "108", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:ISS, author = "Shujie Li and Guanghu Yuan and Min Yang and Ying Shen and Chengming Li and Ruifeng Xu and Xiaoyan Zhao", title = "Improving Semi-Supervised Text Classification with Dual Meta-Learning", journal = j-TOIS, volume = "42", number = "4", pages = "109:1--109:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3648612", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3648612", abstract = "The goal of semi-supervised text classification (SSTC) is to train a model by exploring both a small number of labeled data and a large number of unlabeled data, such that the learned semi-supervised classifier performs better than the supervised \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "109", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zha:2024:TUR, author = "Rui Zha and Ying Sun and Chuan Qin and Le Zhang and Tong Xu and Hengshu Zhu and Enhong Chen", title = "Towards Unified Representation Learning for Career Mobility Analysis with Trajectory Hypergraph", journal = j-TOIS, volume = "42", number = "4", pages = "110:1--110:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3651158", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3651158", abstract = "Career mobility analysis aims at understanding the occupational movement patterns of talents across distinct labor market entities, which enables a wide range of talent-centered applications, such as job recommendation, labor demand forecasting, and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "110", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:IBB, author = "Tianshi Wang and Fengling Li and Lei Zhu and Jingjing Li and Zheng Zhang and Heng Tao Shen", title = "Invisible Black-Box Backdoor Attack against Deep Cross-Modal Hashing Retrieval", journal = j-TOIS, volume = "42", number = "4", pages = "111:1--111:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3650205", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3650205", abstract = "Deep cross-modal hashing has promoted the field of multi-modal retrieval due to its excellent efficiency and storage, but its vulnerability to backdoor attacks is rarely studied. Notably, current deep cross-modal hashing methods inevitably require large-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "111", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Pu:2024:EEL, author = "Yanjun Pu and Fang Liu and Rongye Shi and Haitao Yuan and Ruibo Chen and Tianhao Peng and Wenjun Wu", title = "{ELAKT}: Enhancing Locality for Attentive Knowledge Tracing", journal = j-TOIS, volume = "42", number = "4", pages = "112:1--112:??", month = jul, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652601", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Thu May 16 10:57:30 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652601", abstract = "Knowledge tracing models based on deep learning can achieve impressive predictive performance by leveraging attention mechanisms. However, there still exist two challenges in attentive knowledge tracing (AKT): First, the mechanism of classical models of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "112", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bruch:2024:SSE, author = "Sebastian Bruch and Claudio Lucchese and Maria Maistro and Franco Maria Nardini", title = "Special Section on Efficiency in Neural Information Retrieval", journal = j-TOIS, volume = "42", number = "5", pages = "113:1--113:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3641203", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3641203", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "113", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Rau:2024:RBW, author = "David Rau and Mostafa Dehghani and Jaap Kamps", title = "Revisiting Bag of Words Document Representations for Efficient Ranking with Transformers", journal = j-TOIS, volume = "42", number = "5", pages = "114:1--114:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3640460", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3640460", abstract = "Modern transformer-based information retrieval models achieve state-of-the-art performance across various benchmarks. The self-attention of the transformer models is a powerful mechanism to contextualize terms over the whole input but quickly becomes \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "114", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Askari:2024:REL, author = "Arian Askari and Suzan Verberne and Amin Abolghasemi and Wessel Kraaij and Gabriella Pasi", title = "Retrieval for Extremely Long Queries and Documents with {RPRS}: a Highly Efficient and Effective Transformer-based Re-Ranker", journal = j-TOIS, volume = "42", number = "5", pages = "115:1--115:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631938", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631938", abstract = "Retrieval with extremely long queries and documents is a well-known and challenging task in information retrieval and is commonly known as Query-by-Document (QBD) retrieval. Specifically designed Transformer models that can handle long input sequences \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "115", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Formal:2024:TEE, author = "Thibault Formal and Carlos Lassance and Benjamin Piwowarski and St{\'e}phane Clinchant", title = "Towards Effective and Efficient Sparse Neural Information Retrieval", journal = j-TOIS, volume = "42", number = "5", pages = "116:1--116:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3634912", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3634912", abstract = "Sparse representation learning based on Pre-trained Language Models has seen a growing interest in Information Retrieval. Such approaches can take advantage of the proven efficiency of inverted indexes and inherit desirable IR priors such as explicit \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "116", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Leonhardt:2024:ENR, author = "Jurek Leonhardt and Henrik M{\"u}ller and Koustav Rudra and Megha Khosla and Abhijit Anand and Avishek Anand", title = "Efficient Neural Ranking Using Forward Indexes and Lightweight Encoders", journal = j-TOIS, volume = "42", number = "5", pages = "117:1--117:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3631939", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3631939", abstract = "Dual-encoder-based dense retrieval models have become the standard in IR. They employ large Transformer-based language models, which are notoriously inefficient in terms of resources and latency. We propose Fast-Forward indexes-vector forward indexes \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "117", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2024:AMM, author = "Qi Liu and Gang Guo and Jiaxin Mao and Zhicheng Dou and Ji-Rong Wen and Hao Jiang and Xinyu Zhang and Zhao Cao", title = "An Analysis on Matching Mechanisms and Token Pruning for Late-interaction Models", journal = j-TOIS, volume = "42", number = "5", pages = "118:1--118:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3639818", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3639818", abstract = "With the development of pre-trained language models, the dense retrieval models have become promising alternatives to the traditional retrieval models that rely on exact match and sparse bag-of-words representations. Different from most dense retrieval \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "118", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Anand:2024:DAS, author = "Abhijit Anand and Jurek Leonhardt and Jaspreet Singh and Koustav Rudra and Avishek Anand", title = "Data Augmentation for Sample Efficient and Robust Document Ranking", journal = j-TOIS, volume = "42", number = "5", pages = "119:1--119:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3634911", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3634911", abstract = "Contextual ranking models have delivered impressive performance improvements over classical models in the document ranking task. However, these highly over-parameterized models tend to be data-hungry and require large amounts of data even for fine-tuning. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "119", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yan:2024:TEM, author = "Surong Yan and Chenglong Shi and Haosen Wang and Lei Chen and Ling Jiang and Ruilin Guo and Kwei-Jay Lin", title = "Teach and Explore: a Multiplex Information-guided Effective and Efficient Reinforcement Learning for Sequential Recommendation", journal = j-TOIS, volume = "42", number = "5", pages = "120:1--120:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3630003", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3630003", abstract = "Casting sequential recommendation (SR) as a reinforcement learning (RL) problem is promising and some RL-based methods have been proposed for SR. However, these models are sub-optimal due to the following limitations: (a) they fail to leverage the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "120", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lien:2024:GWS, author = "Yen-Chieh Lien and Hamed Zamani and Bruce Croft", title = "Generalized Weak Supervision for Neural Information Retrieval", journal = j-TOIS, volume = "42", number = "5", pages = "121:1--121:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3647639", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3647639", abstract = "Neural ranking models (NRMs) have demonstrated effective performance in several information retrieval (IR) tasks. However, training NRMs often requires large-scale training data, which is difficult and expensive to obtain. To address this issue, one can \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "121", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Frummet:2024:CCE, author = "Alexander Frummet and Alessandro Speggiorin and David Elsweiler and Anton Leuski and Jeff Dalton", title = "Cooking with Conversation: Enhancing User Engagement and Learning with a Knowledge-Enhancing Assistant", journal = j-TOIS, volume = "42", number = "5", pages = "122:1--122:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3649500", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3649500", abstract = "We present two empirical studies to investigate users' expectations and behaviours when using digital assistants, such as Alexa and Google Home, in a kitchen context: First, a survey (N = 200) queries participants on their expectations for the kinds of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "122", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2024:CMC, author = "Yunchang Zhu and Liang Pang and Kangxi Wu and Yanyan Lan and Huawei Shen and Xueqi Cheng", title = "Cross-Model Comparative Loss for Enhancing Neuronal Utility in Language Understanding", journal = j-TOIS, volume = "42", number = "5", pages = "123:1--123:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652599", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652599", abstract = "Current natural language understanding (NLU) models have been continuously scaling up, both in terms of model size and input context, introducing more hidden and input neurons. While this generally improves performance on average, the extra neurons do not \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "123", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:TCB, author = "Jian Wang and Dongding Lin and Wenjie Li", title = "Target-constrained Bidirectional Planning for Generation of Target-oriented Proactive Dialogue", journal = j-TOIS, volume = "42", number = "5", pages = "124:1--124:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652598", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652598", abstract = "Target-oriented proactive dialogue systems aim at leading conversations from a dialogue context toward a pre-determined target, such as making recommendations on designated items or introducing new specific topics. To this end, it is critical for such \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "124", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2024:DFM, author = "Enyue Yang and Weike Pan and Qiang Yang and Zhong Ming", title = "Discrete Federated Multi-behavior Recommendation for Privacy-Preserving Heterogeneous One-Class Collaborative Filtering", journal = j-TOIS, volume = "42", number = "5", pages = "125:1--125:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652853", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652853", abstract = "Recently, federated recommendation has become a research hotspot mainly because of users' awareness of privacy in data. As a recent and important recommendation problem, in heterogeneous one-class collaborative filtering (HOCCF), each user may involve of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "125", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2024:MGD, author = "Zhirui Deng and Zhicheng Dou and Zhan Su and Ji-Rong Wen", title = "Multi-grained Document Modeling for Search Result Diversification", journal = j-TOIS, volume = "42", number = "5", pages = "126:1--126:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652852", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652852", abstract = "Search result diversification plays a crucial role in improving users' search experience by providing users with documents covering more subtopics. Previous studies have made great progress in leveraging inter-document interactions to measure the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "126", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yi:2024:DCN, author = "Kun Yi and Qi Zhang and Hui He and Kaize Shi and Liang Hu and Ning An and Zhendong Niu", title = "Deep Coupling Network for Multivariate Time Series Forecasting", journal = j-TOIS, volume = "42", number = "5", pages = "127:1--127:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653447", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653447", abstract = "Multivariate time series (MTS) forecasting is crucial in many real-world applications. To achieve accurate MTS forecasting, it is essential to simultaneously consider both intra- and inter-series relationships among time series data. However, previous \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "127", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2024:BRF, author = "Hanzhe Li and Jingjing Gu and Xinjiang Lu and Dazhong Shen and Yuting Liu and YaNan Deng and Guoliang Shi and Hui Xiong", title = "Beyond Relevance: Factor-level Causal Explanation for User Travel Decisions with Counterfactual Data Augmentation", journal = j-TOIS, volume = "42", number = "5", pages = "128:1--128:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653673", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653673", abstract = "Point-of-Interest (POI) recommendation, an important research hotspot in the field of urban computing, plays a crucial role in urban construction. While understanding the process of users' travel decisions and exploring the causality of POI choosing is \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "128", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tang:2024:DRD, author = "Xing Tang and Ling Chen and Hongyu Shi and Dandan Lyu", title = "{DHyper}: a Recurrent Dual Hypergraph Neural Network for Event Prediction in Temporal Knowledge Graphs", journal = j-TOIS, volume = "42", number = "5", pages = "129:1--129:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653015", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653015", abstract = "Event prediction is a vital and challenging task in temporal knowledge graphs (TKGs), which have played crucial roles in various applications. Recently, many graph neural networks based approaches are proposed to model the graph structure information in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "129", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2024:SSP, author = "Junfan Chen and Richong Zhang and Xiaohan Jiang and Chunming Hu", title = "{SPContrastNet}: a Self-Paced Contrastive Learning Model for Few-Shot Text Classification", journal = j-TOIS, volume = "42", number = "5", pages = "130:1--130:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652600", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652600", abstract = "Meta-learning has recently promoted few-shot text classification, which identifies target classes based on information transferred from source classes through a series of small tasks or episodes. Existing works constructing their meta-learner on \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "130", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2024:DFA, author = "Hao Yang and Xian Wu and Zhaopeng Qiu and Yefeng Zheng and Xu Chen", title = "Distributional Fairness-aware Recommendation", journal = j-TOIS, volume = "42", number = "5", pages = "131:1--131:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3652854", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3652854", abstract = "Fairness has been gradually recognized as a significant problem in the recommendation domain. Previous models usually achieve fairness by reducing the average performance gap between different user groups. However, the average performance may not \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "131", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shi:2024:DSR, author = "Chaoyu Shi and Pengjie Ren and Dongjie Fu and Xin Xin and Shansong Yang and Fei Cai and Zhaochun Ren and Zhumin Chen", title = "Diversifying Sequential Recommendation with Retrospective and Prospective Transformers", journal = j-TOIS, volume = "42", number = "5", pages = "132:1--132:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653016", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653016", abstract = "Previous studies on sequential recommendation (SR) have predominantly concentrated on optimizing recommendation accuracy. However, there remains a significant gap in enhancing recommendation diversity, particularly for short interaction sequences. The \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "132", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tang:2024:LGR, author = "Yubao Tang and Ruqing Zhang and Jiafeng Guo and Maarten de Rijke and Wei Chen and Xueqi Cheng", title = "Listwise Generative Retrieval Models via a Sequential Learning Process", journal = j-TOIS, volume = "42", number = "5", pages = "133:1--133:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653712", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653712", abstract = "Recently, a novel generative retrieval (GR) paradigm has been proposed, where a single sequence-to-sequence model is learned to directly generate a list of relevant document identifiers (docids) given a query. Existing GR models commonly employ maximum \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "133", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wen:2024:PAE, author = "Zhiyuan Wen and Jiannong Cao and Jiaxing Shen and Ruosong Yang and Shuaiqi Liu and Maosong Sun", title = "Personality-affected Emotion Generation in Dialog Systems", journal = j-TOIS, volume = "42", number = "5", pages = "134:1--134:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3655616", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3655616", abstract = "Generating appropriate emotions for responses is essential for dialogue systems to provide human-like interaction in various application scenarios. Most previous dialogue systems tried to achieve this goal by learning empathetic manners from anonymous \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "134", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tian:2024:PPC, author = "Changxin Tian and Yuexiang Xie and Xu Chen and Yaliang Li and Xin Zhao", title = "Privacy-preserving Cross-domain Recommendation with Federated Graph Learning", journal = j-TOIS, volume = "42", number = "5", pages = "135:1--135:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653448", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653448", abstract = "As people inevitably interact with items across multiple domains or various platforms, cross-domain recommendation (CDR) has gained increasing attention. However, the rising privacy concerns limit the practical applications of existing CDR models, since \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "135", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Su:2024:PAS, author = "Zhan Su and Zhicheng Dou and Yutao Zhu and Ji-Rong Wen", title = "Passage-aware Search Result Diversification", journal = j-TOIS, volume = "42", number = "5", pages = "136:1--136:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3653672", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3653672", abstract = "Research on search result diversification strives to enhance the variety of subtopics within the list of search results. Existing studies usually treat a document as a whole and represent it with one fixed-length vector. However, considering that a long \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "136", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:CDN, author = "Xinghua Zhang and Bowen Yu and Xin Cong and Taoyu Su and Quangang Li and Tingwen Liu and Hongbo Xu", title = "Cross-Domain {NER} under a Divide-and-Transfer Paradigm", journal = j-TOIS, volume = "42", number = "5", pages = "137:1--137:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3655618", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3655618", abstract = "Cross-domain Named Entity Recognition (NER) transfers knowledge learned from a rich-resource source domain to improve the learning in a low-resource target domain. Most existing works are designed based on the sequence labeling framework, defining entity \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "137", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:SSN, author = "Yuxiang Zhang and Junjie Wang and Xinyu Zhu and Tetsuya Sakai and Hayato Yamana", title = "{SSR}: Solving Named Entity Recognition Problems via a Single-stream Reasoner", journal = j-TOIS, volume = "42", number = "5", pages = "138:1--138:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3655619", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3655619", abstract = "Information Extraction (IE) focuses on transforming unstructured data into structured knowledge, of which Named Entity Recognition (NER) is a fundamental component. In the realm of Information Retrieval (IR), effectively recognizing entities can \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "138", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2024:FTI, author = "Fei Liu and Chenyang Bu and Haotian Zhang and Le Wu and Kui Yu and Xuegang Hu", title = "{FDKT}: Towards an Interpretable Deep Knowledge Tracing via Fuzzy Reasoning", journal = j-TOIS, volume = "42", number = "5", pages = "139:1--139:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3656167", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3656167", abstract = "In educational data mining, knowledge tracing (KT) aims to model learning performance based on student knowledge mastery. Deep-learning-based KT models perform remarkably better than traditional KT and have attracted considerable attention. However, most \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "139", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shao:2024:AUS, author = "Pengyang Shao and Le Wu and Kun Zhang and Defu Lian and Richang Hong and Yong Li and Meng Wang", title = "Average User-Side Counterfactual Fairness for Collaborative Filtering", journal = j-TOIS, volume = "42", number = "5", pages = "140:1--140:??", month = sep, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3656639", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue Jun 4 06:03:40 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3656639", abstract = "Recently, the user-side fairness issue in Collaborative Filtering (CF) algorithms has gained considerable attention, arguing that results should not discriminate an individual or a sub-user group based on users' sensitive attributes (e.g., gender). \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "140", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Luo:2024:CSR, author = "Tianze Luo and Yong Liu and Sinno Jialin Pan", title = "Collaborative Sequential Recommendations via Multi-view {GNN}-transformers", journal = j-TOIS, volume = "42", number = "6", pages = "141:1--141:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3649436", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3649436", abstract = "Sequential recommendation systems aim to exploit users' sequential behavior patterns to capture their interaction intentions and improve recommendation accuracy. Existing sequential recommendation methods mainly focus on modeling the items' chronological \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "141", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:TBA, author = "Zhidan Wang and Lixin Zou and Chenliang Li and Shuaiqiang Wang and Xu Chen and Dawei Yin and Weidong Liu", title = "Toward Bias-Agnostic Recommender Systems: a Universal Generative Framework", journal = j-TOIS, volume = "42", number = "6", pages = "142:1--142:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3655617", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3655617", abstract = "User behavior data, such as ratings and clicks, has been widely used to build personalizing models for recommender systems. However, many unflattering factors (e.g., popularity, ranking position, users' selection) significantly affect the performance of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "142", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:DLR, author = "Quan Wang and Zhendong Mao and Jie Gao and Yongdong Zhang", title = "Document-level Relation Extraction with Progressive Self-distillation", journal = j-TOIS, volume = "42", number = "6", pages = "143:1--143:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3656168", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3656168", abstract = "Document-level relation extraction (RE) aims to simultaneously predict relations (including no-relation cases denoted as NA) between all entity pairs in a document. It is typically formulated as a relation classification task with entities pre-detected in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "143", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhuo:2024:MHM, author = "Xingrui Zhuo and Shengsheng Qian and Jun Hu and Fuxin Dai and Kangyi Lin and Gongqing Wu", title = "Multi-Hop Multi-View Memory Transformer for Session-Based Recommendation", journal = j-TOIS, volume = "42", number = "6", pages = "144:1--144:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3663760", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3663760", abstract = "A Session-Based Recommendation (SBR) seeks to predict users' future item preferences by analyzing their interactions with previously clicked items. In recent approaches, Graph Neural Networks (GNNs) have been commonly applied to capture item relations \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "144", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zeng:2024:XLS, author = "Kaisheng Zeng and Hailong Jin and Xin Lv and Fangwei Zhu and Lei Hou and Yi Zhang and Fan Pang and Yu Qi and Dingxiao Liu and Juanzi Li and Ling Feng", title = "{XLORE 3}: a Large-Scale Multilingual Knowledge Graph from Heterogeneous {Wiki} Knowledge Resources", journal = j-TOIS, volume = "42", number = "6", pages = "145:1--145:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3660521", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3660521", abstract = "In recent years, knowledge graph (KG) has attracted significant attention from academia and industry, resulting in the development of numerous technologies for KG construction, completion, and application. XLORE is one of the largest multilingual KGs \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "145", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2024:MRC, author = "Yanan Wang and Yong Ge and Zhepeng Li and Li Li and Rui Chen", title = "{M$^3$Rec}: a Context-Aware Offline Meta-Level Model-Based Reinforcement Learning Approach for Cold-Start Recommendation", journal = j-TOIS, volume = "42", number = "6", pages = "146:1--146:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3659947", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3659947", abstract = "Reinforcement learning (RL) has shown great promise in optimizing long-term user interest in recommender systems. However, existing RL-based recommendation methods need a large number of interactions for each user to learn the recommendation policy. The \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "146", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shi:2024:UGN, author = "Chuan Shi and Meiqi Zhu and Yue Yu and Xiao Wang and Junping Du", title = "Unifying Graph Neural Networks with a Generalized Optimization Framework", journal = j-TOIS, volume = "42", number = "6", pages = "147:1--147:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3660852", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3660852", abstract = "Graph Neural Networks (GNNs) have received considerable attention on graph-structured data learning for a wide variety of tasks. The well-designed propagation mechanism, which has been demonstrated effective, is the most fundamental part of GNNs. Although \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "147", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Peng:2024:USB, author = "Hao Peng and Jingyun Zhang and Xiang Huang and Zhifeng Hao and Angsheng Li and Zhengtao Yu and Philip S. Yu", title = "Unsupervised Social Bot Detection via Structural Information Theory", journal = j-TOIS, volume = "42", number = "6", pages = "148:1--148:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3660522", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3660522", abstract = "Research on social bot detection plays a crucial role in maintaining the order and reliability of information dissemination while increasing trust in social interactions. The current mainstream social bot detection models rely on black-box neural network \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "148", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Shi:2024:BTN, author = "Haitao Shi and Meng Liu and Xiaoxuan Mu and Xuemeng Song and Yupeng Hu and Liqiang Nie", title = "Breaking Through the Noisy Correspondence: a Robust Model for Image-Text Matching", journal = j-TOIS, volume = "42", number = "6", pages = "149:1--149:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3662732", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3662732", abstract = "Unleashing the power of image-text matching in real-world applications is hampered by noisy correspondence. Manually curating high-quality datasets is expensive and time-consuming, and datasets generated using diffusion models are not adequately well-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "149", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2024:OCO, author = "Xiaocong Chen and Siyu Wang and Julian McAuley and Dietmar Jannach and Lina Yao", title = "On the Opportunities and Challenges of Offline Reinforcement Learning for Recommender Systems", journal = j-TOIS, volume = "42", number = "6", pages = "150:1--150:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3661996", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3661996", abstract = "Reinforcement learning serves as a potent tool for modeling dynamic user interests within recommender systems, garnering increasing research attention of late. However, a significant drawback persists: its poor data efficiency, stemming from its \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "150", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bruch:2024:BDS, author = "Sebastian Bruch and Franco Maria Nardini and Amir Ingber and Edo Liberty", title = "Bridging Dense and Sparse Maximum Inner Product Search", journal = j-TOIS, volume = "42", number = "6", pages = "151:1--151:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3665324", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3665324", abstract = "Maximum inner product search (MIPS) over dense and sparse vectors have progressed independently in a bifurcated literature for decades; the latter is better known as top- \(k\) retrieval in Information Retrieval. This duality exists because sparse and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "151", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{An:2024:MMV, author = "Jingmin An and Ming Gao and Jiafu Tang", title = "{MvStHgL}: Multi-View Hypergraph Learning with Spatial-Temporal Periodic Interests for Next {POI} Recommendation", journal = j-TOIS, volume = "42", number = "6", pages = "152:1--152:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3664651", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3664651", abstract = "Providing potential next point-of-interest (POI) suggestions for users has become a prominent task in location-based social networks, which receives more and more attention from the industry and academia and it remains challenging due to highly dynamic \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "152", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2024:CMD, author = "KE Sun and Chenliang Li and Tieyun Qian", title = "City Matters! {A} Dual-Target Cross-City Sequential {POI} Recommendation Model", journal = j-TOIS, volume = "42", number = "6", pages = "153:1--153:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3664284", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3664284", abstract = "Existing sequential Point of Interest (POI) recommendation methods overlook a fact that each city exhibits distinct characteristics and totally ignore the city signature. In this study, we claim that city matters in sequential POI recommendation and fully \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "153", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:SCS, author = "Yabin Zhang and Zhenlei Wang and Wenhui Yu and Lantao Hu and Peng Jiang and Kun Gai and Xu Chen", title = "Soft Contrastive Sequential Recommendation", journal = j-TOIS, volume = "42", number = "6", pages = "154:1--154:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3665325", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3665325", abstract = "Contrastive learning has recently emerged as an effective strategy for improving the performance of sequential recommendation. However, traditional models commonly construct the contrastive loss by directly optimizing human-designed positive and negative \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "154", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhou:2024:RRO, author = "Yujia Zhou and Jing Yao and Zhicheng Dou and Yiteng Tu and Ledell Wu and Tat-Seng Chua and Ji-Rong Wen", title = "{ROGER}: Ranking-Oriented Generative Retrieval", journal = j-TOIS, volume = "42", number = "6", pages = "155:1--155:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3603167", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3603167", abstract = "In recent years, various dense retrieval methods have been developed to improve the performance of search engines with a vectorized index. However, these approaches require a large pre-computed index and have a limited capacity to memorize all semantics \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "155", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2024:AIP, author = "Lijian Chen and Wei Yuan and Tong Chen and Guanhua Ye and Nguyen Quoc Viet Hung and Hongzhi Yin", title = "Adversarial Item Promotion on Visually-Aware Recommender Systems by Guided Diffusion", journal = j-TOIS, volume = "42", number = "6", pages = "156:1--156:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3666088", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3666088", abstract = "Visually-aware recommender systems have found widespread applications in domains where visual elements significantly contribute to the inference of users' potential preferences. While the incorporation of visual information holds the promise of enhancing \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "156", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jiang:2024:TFM, author = "Yiheng Jiang and Yuanbo Xu and Yongjian Yang and Funing Yang and Pengyang Wang and Chaozhuo Li and Fuzhen Zhuang and Hui Xiong", title = "{TriMLP}: a Foundational {MLP}-Like Architecture for Sequential Recommendation", journal = j-TOIS, volume = "42", number = "6", pages = "157:1--157:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3670995", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3670995", abstract = "In this work, we present TriMLP as a foundational MLP-like architecture for the sequential recommendation, simultaneously achieving computational efficiency and promising performance. First, we empirically study the incompatibility between existing purely \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "157", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2024:RRC, author = "Siyi Lin and Sheng Zhou and Jiawei Chen and Yan Feng and Qihao Shi and Chun Chen and Ying Li and Can Wang", title = "{ReCRec}: Reasoning the Causes of Implicit Feedback for Debiased Recommendation", journal = j-TOIS, volume = "42", number = "6", pages = "158:1--158:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3672275", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3672275", abstract = "Implicit feedback (e.g., user clicks) is widely used in building recommender systems (RS). However, the inherent notorious exposure bias significantly affects recommendation performance. Exposure bias refers a phenomenon that implicit feedback is \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "158", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fan:2024:OMA, author = "Yu-Chen Fan and Yitong Ji and Jie Zhang and Aixin Sun", title = "Our Model Achieves Excellent Performance on {MovieLens}: What Does It Mean?", journal = j-TOIS, volume = "42", number = "6", pages = "159:1--159:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3675163", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3675163", abstract = "A typical benchmark dataset for recommender system (RecSys) evaluation consists of user-item interactions generated on a platform within a time period. The interaction generation mechanism partially explains why a user interacts with (e.g., like, purchase,. \ldots{})", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "159", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zou:2024:ATL, author = "Tao Zou and Le Yu and Junchen Ye and Leilei Sun and Bowen Du and Deqing Wang", title = "Adaptive Taxonomy Learning and Historical Patterns Modeling for Patent Classification", journal = j-TOIS, volume = "42", number = "6", pages = "160:1--160:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3674834", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3674834", abstract = "Patent classification aims to assign multiple International Patent Classification (IPC) codes to a given patent. Existing methods for automated patent classification primarily focus on analyzing the text descriptions of patents. However, apart from the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "160", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2024:ELM, author = "Chen Zhang and Benyou Wang and Dawei Song", title = "On Elastic Language Models", journal = j-TOIS, volume = "42", number = "6", pages = "161:1--161:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3677375", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3677375", abstract = "Large-scale pretrained language models have achieved compelling performance in a wide range of language understanding and information retrieval tasks. While their large scales ensure capacity, they also hinder deployment. Knowledge distillation offers an \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "161", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zou:2024:KEC, author = "Jie Zou and Aixin Sun and Cheng Long and Evangelos Kanoulas", title = "Knowledge-Enhanced Conversational Recommendation via Transformer-Based Sequential Modeling", journal = j-TOIS, volume = "42", number = "6", pages = "162:1--162:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3677376", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3677376", abstract = "In conversational recommender systems (CRSs), conversations usually involve a set of items and item-related entities or attributes, e.g., director is a related entity of a movie. These items and item-related entities are often mentioned along the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "162", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2024:DCL, author = "Jingyun Xu and Junnan Yu and Yi Cai and Tat-Seng Chua", title = "Dual Contrastive Learning for Cross-Domain Named Entity Recognition", journal = j-TOIS, volume = "42", number = "6", pages = "163:1--163:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3678879", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3678879", abstract = "Benefiting many information retrieval applications, named entity recognition (NER) has shown impressive progress. Recently, there has been a growing trend to decompose complex NER tasks into two subtasks (e.g., entity span detection (ESD) and entity type \ldots{})", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "163", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jarvelin:2024:BIE, author = "Kalervo Jarvelin and Eero Sormunen", title = "A Blueprint of {IR} Evaluation Integrating Task and User Characteristics", journal = j-TOIS, volume = "42", number = "6", pages = "164:1--164:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3675162", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3675162", abstract = "Traditional search result evaluation metrics in information retrieval, such as MAP and NDCG, naively focus on topical relevance between a document and search topic and assume this relationship as mono-dimensional and often binary. They neglect document \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "164", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Pei:2024:MLR, author = "Jiahuan Pei and Guojun Yan and Maarten {De Rijke} and Pengjie Ren", title = "Mixture-of-Languages Routing for Multilingual Dialogues", journal = j-TOIS, volume = "42", number = "6", pages = "165:1--165:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3676956", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3676956", abstract = "We consider multilingual dialogue systems and ask how the performance of a dialogue system can be improved by using information that is available in other languages than the language in which a conversation is being conducted. We adopt a collaborative \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "165", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Keshvari:2024:SDL, author = "Sanaz Keshvari and Farzan Saeedi and Hadi Sadoghi Yazdi and Faezeh Ensan", title = "A Self-Distilled Learning to Rank Model for Ad Hoc Retrieval", journal = j-TOIS, volume = "42", number = "6", pages = "166:1--166:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3681784", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3681784", abstract = "Learning to rank models are broadly applied in ad hoc retrieval for scoring and sorting documents based on their relevance to textual queries. The generalizability of the trained model in the learning to rank approach, however, can have an impact on the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "166", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2024:CBG, author = "Fan Liu and Shuai Zhao and Zhiyong Cheng and Liqiang Nie and Mohan Kankanhalli", title = "Cluster-Based Graph Collaborative Filtering", journal = j-TOIS, volume = "42", number = "6", pages = "167:1--167:??", month = nov, year = "2024", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3687481", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Wed Oct 23 06:02:05 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3687481", abstract = "Graph Convolution Networks (GCNs) have significantly succeeded in learning user and item representations for recommendation systems. The core of their efficacy is the ability to explicitly exploit the collaborative signals from both the first- and high-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "167", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liao:2025:RNS, author = "Weibin Liao and Yifan Zhu and Yanyan Li and Qi Zhang and Zhonghong Ou and Xuesong Li", title = "{RevGNN}: Negative Sampling Enhanced Contrastive Graph Learning for Academic Reviewer Recommendation", journal = j-TOIS, volume = "43", number = "1", pages = "1:1--1:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3679200", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3679200", abstract = "Acquiring reviewers for academic submissions is a challenging recommendation scenario. Recent graph learning-driven models have made remarkable progress in the field of recommendation, but their performance in the academic reviewer recommendation task may \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tavakoli:2025:OOE, author = "Leila Tavakoli and Johanne R. Trippas and Hamed Zamani and Falk Scholer and Mark Sanderson", title = "Online and Offline Evaluation in Search Clarification", journal = j-TOIS, volume = "43", number = "1", pages = "2:1--2:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3681786", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3681786", abstract = "The effectiveness of clarification question models in engaging users within search systems is currently constrained, casting doubt on their overall usefulness. To improve the performance of these models, it is crucial to employ assessment approaches that \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sang:2025:AAG, author = "Lei Sang and Honghao Li and Yiwen Zhang and Yi Zhang and Yun Yang", title = "{AdaGIN}: Adaptive Graph Interaction Network for Click-Through Rate Prediction", journal = j-TOIS, volume = "43", number = "1", pages = "3:1--3:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3681785", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3681785", abstract = "The goal of click-through rate (CTR) prediction in recommender systems is to effectively work with input features. However, existing CTR prediction models face three main issues. First, many models use a basic approach for feature combinations, leading to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:CCE, author = "Honghao Li and Lei Sang and Yi Zhang and Xuyun Zhang and Yiwen Zhang", title = "{CETN}: Contrast-enhanced Through Network for Click-Through Rate Prediction", journal = j-TOIS, volume = "43", number = "1", pages = "4:1--4:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3688571", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3688571", abstract = "Click-through rate (CTR) prediction is a crucial task in personalized information retrievals, such as industrial recommender systems, online advertising, and web search. Most existing CTR Prediction models utilize explicit feature interactions to overcome \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tang:2025:TTC, author = "Haoran Tang and Shiqing Wu and Xueyao Sun and Jun Zeng and Guandong Xu and Qing Li", title = "{TCGC}: Temporal Collaboration-Aware Graph Co-Evolution Learning for Dynamic Recommendation", journal = j-TOIS, volume = "43", number = "1", pages = "5:1--5:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3687470", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3687470", abstract = "Dynamic recommendation systems, where users interact with items continuously over time, have been widely deployed in real-world online streaming applications. The burst of interaction stream causes a rapid evolution of both users and items. To update \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:DCL, author = "Nuo Xu and Pinghui Wang and Junzhou Zhao and Feiyang Sun and Lin Lan and Jing Tao and Li Pan and Xiaohong Guan", title = "Distinguish Confusion in Legal Judgment Prediction via Revised Relation Knowledge", journal = j-TOIS, volume = "43", number = "1", pages = "6:1--6:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3689628", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3689628", abstract = "Legal Judgment Prediction (LJP) aims to automatically predict a law case's judgment results based on the text description of its facts. In practice, the confusing law articles (or charges) problem frequently occurs, reflecting that the law cases \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:FEN, author = "Xiaoyu Zhang and Shaoyun Shi and Yishan Li and Weizhi Ma and Peijie Sun and Min Zhang", title = "Feature-Enhanced Neural Collaborative Reasoning for Explainable Recommendation", journal = j-TOIS, volume = "43", number = "1", pages = "7:1--7:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3690381", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3690381", abstract = "Providing reasonable explanations for a specific suggestion given by the recommender can help users trust the system more. As logic rule-based inference is concise, transparent, and aligned with human cognition, it can be adopted to improve the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Peng:2025:PEF, author = "Qiyao Peng and Hongyan Xu and Yinghui Wang and Hongtao Liu and Cuiying Huo and Wenjun Wang", title = "{PEPT}: Expert Finding Meets Personalized Pre-Training", journal = j-TOIS, volume = "43", number = "1", pages = "8:1--8:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3690380", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3690380", abstract = "Finding experts is essential in Community Question Answering (CQA) platforms as it enables the effective routing of questions to potential users who can provide relevant answers. The key is to personalized learning expert representations based on their \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Anand:2025:SRS, author = "Vineeta Anand and Ashish Kumar Maurya", title = "A Survey on Recommender Systems Using Graph Neural Network", journal = j-TOIS, volume = "43", number = "1", pages = "9:1--9:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3694784", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3694784", abstract = "The expansion of the Internet has resulted in a change in the flow of information. With the vast amount of digital information generated online, it is easy for users to feel overwhelmed. Finding the specific information can be a challenge, and it can be \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cai:2025:DRS, author = "Qiqi Cai and Jian Cao and Guandong Xu and Nengjun Zhu", title = "Distributed Recommendation Systems: Survey and Research Directions", journal = j-TOIS, volume = "43", number = "1", pages = "10:1--10:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3694783", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3694783", abstract = "With the explosive growth of online information, recommendation systems have become essential tools for alleviating information overload. In recent years, researchers have increasingly focused on centralized recommendation systems, capitalizing on the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:LMT, author = "Chen Xu and Xiaopeng Ye and Jun Xu and Xiao Zhang and Weiran Shen and Ji-Rong Wen", title = "{LTP-MMF}: Toward Long-Term Provider Max-Min Fairness under Recommendation Feedback Loops", journal = j-TOIS, volume = "43", number = "1", pages = "11:1--11:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3695867", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3695867", abstract = "Multi-stakeholder recommender systems involve various roles, such as users and providers. Previous work pointed out that max-min fairness (MMF) is a better metric to support weak providers. However, when considering MMF, the features or parameters of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:RPB, author = "Pu Li and Xiaoyan Yu and Hao Peng and Yantuan Xian and Linqin Wang and Li Sun and Jingyun Zhang and Philip S. Yu", title = "Relational Prompt-Based Pre-Trained Language Models for Social Event Detection", journal = j-TOIS, volume = "43", number = "1", pages = "12:1--12:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3695869", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3695869", abstract = "Social Event Detection (SED) aims to identify significant events from social streams, and has a wide application ranging from public opinion analysis to risk management. In recent years, Graph Neural Network (GNN) based solutions have achieved state-of-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wan:2025:MGB, author = "Qizhi Wan and Changxuan Wan and Keli Xiao and Rong Hu and Dexi Liu and Guoqiong Liao and Xiping Liu and Yuxin Shuai", title = "A Multifocal Graph-Based Neural Network Scheme for Topic Event Extraction", journal = j-TOIS, volume = "43", number = "1", pages = "13:1--13:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3696353", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3696353", abstract = "Event extraction is a long-standing and challenging task in natural language processing, and existing studies mainly focus on extracting events within sentences. However, a significant problem that has not been carefully investigated is whether an \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2025:MLR, author = "Xuyang Wu and Ajit Puthenputhussery and Hongwei Shang and Changsung Kang and Yi Fang", title = "Meta-Learning to Rank for Sparsely Supervised Queries", journal = j-TOIS, volume = "43", number = "1", pages = "14:1--14:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3698876", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3698876", abstract = "Supervisory signals are a critical resource for training learning to rank models. In many real-world search and retrieval scenarios, these signals may not be readily available or could be costly to obtain for some queries. The examples include domains \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:RCD, author = "Bobo Li and Hao Fei and Fei Li and Shengqiong Wu and Lizi Liao and Yinwei Wei and Tat-seng Chua and Donghong Ji", title = "Revisiting Conversation Discourse for Dialogue Disentanglement", journal = j-TOIS, volume = "43", number = "1", pages = "15:1--15:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3698191", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3698191", abstract = "Dialogue disentanglement aims to detach the chronologically ordered utterances into several independent sessions. Conversation utterances are essentially organized and described by the underlying discourse, and thus dialogue disentanglement requires the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhou:2025:ECS, author = "Qi Zhou and Peng Zhang and Hansu Gu and Tun Lu and Ning Gu", title = "Exploring Cross-Site User Modeling without Cross-Site User Identity Linkage: a Case Study of Content Preference Prediction", journal = j-TOIS, volume = "43", number = "1", pages = "16:1--16:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3697832", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3697832", abstract = "Performing user modeling on two or more social media platforms collaboratively and complementing each other (cross-site user modeling) has been a significant problem in the area of social media mining in recent years. The core of this problem is to get to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:ERF, author = "Jie Li and Yongli Ren and Mark Sanderson and Ke Deng", title = "Explaining Recommendation Fairness from a User\slash Item Perspective", journal = j-TOIS, volume = "43", number = "1", pages = "17:1--17:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3698877", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3698877", abstract = "Recommender systems play a crucial role in personalizing user experiences, yet ensuring fairness in their outcomes remains an elusive challenge. This work explores the impact of individual users or items on the fairness of recommender systems, thus \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lan:2025:CCL, author = "Wei Lan and Guoxian Zhou and Qingfeng Chen and Wenguang Wang and Shirui Pan and Yi Pan and Shichao Zhang", title = "Contrastive Clustering Learning for Multi-Behavior Recommendation", journal = j-TOIS, volume = "43", number = "1", pages = "18:1--18:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3698192", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3698192", abstract = "Increasing multiple behavior recommendation models have achieved great successes. However, many models do not consider commonalities and differences between behaviors and data sparsity of the target behavior. This article proposes a novel multi-behavior \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:DDG, author = "Zeyang Zhang and Xin Wang and Haibo Chen and Haoyang Li and Wenwu Zhu", title = "Disentangled Dynamic Graph Attention Network for Out-of-Distribution Sequential Recommendation", journal = j-TOIS, volume = "43", number = "1", pages = "19:1--19:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3701988", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3701988", abstract = "Sequential recommendation, leveraging user-item interaction histories to provide personalized and timely suggestions, has drawn significant research interest recently. With the power of exploiting spatio-temporal dynamics, Dynamic Graph Neural Networks \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2025:MBR, author = "Xi Zhu and Fake Lin and Ziwei Zhao and Tong Xu and Xiangyu Zhao and Zikai Yin and Xueying Li and Enhong Chen", title = "Multi-Behavior Recommendation with Personalized Directed Acyclic Behavior Graphs", journal = j-TOIS, volume = "43", number = "1", pages = "20:1--20:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3696417", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3696417", abstract = "A well-developed recommendation system can not only leverage multi-typed interactions (such as page view, add-to-cart, and purchase ) to better identify user preferences but also demonstrate high performance, low complexity, and strong interpretability. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2025:LRS, author = "Shiguang Wu and Xin Xin and Pengjie Ren and Zhumin Chen and Jun Ma and Maarten de Rijke and Zhaochun Ren", title = "Learning Robust Sequential Recommenders through Confident Soft Labels", journal = j-TOIS, volume = "43", number = "1", pages = "21:1--21:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3700876", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3700876", abstract = "Sequential recommenders that are trained on implicit feedback are usually learned as a multi-class classification task through softmax-based loss functions on one-hot class labels. However, one-hot training labels are sparse and may lead to biased \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:SLE, author = "Yi Zhang and Yiwen Zhang and Lei Sang and Victor S. Sheng", title = "Simplify to the Limit! {Embedding}-Less Graph Collaborative Filtering for Recommender Systems", journal = j-TOIS, volume = "43", number = "1", pages = "22:1--22:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3701230", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3701230", abstract = "The tremendous positive driving effect of Graph Convolutional Network (GCN) and Graph Contrastive Learning (GCL) for recommender systems has become a consensus. GCN encoders are extensively used in recommendation models for capturing high-order \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:UVM, author = "Guolong Wang and Xun Wu and Xun Tu and Zhaoyuan Liu and Junchi Yan", title = "Unsupervised Video Moment Retrieval with Knowledge-Based Pseudo-Supervision Construction", journal = j-TOIS, volume = "43", number = "1", pages = "23:1--23:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3701229", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3701229", abstract = "Video moment retrieval locates a specified moment by a sentence query. Recent approaches have made remarkable advancements with large-scale video-sentence annotations. These annotations require extensive human labor and expertise, leading to the need for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:MAA, author = "Shijie Wang and Wenqi Fan and Xiao-Yong Wei and Xiaowei Mei and Shanru Lin and Qing Li", title = "Multi-Agent Attacks for Black-Box Social Recommendations", journal = j-TOIS, volume = "43", number = "1", pages = "24:1--24:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3696105", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3696105", abstract = "The rise of online social networks has facilitated the evolution of social recommender systems, which incorporate social relations to enhance users' decision-making process. With the great success of Graph Neural Networks (GNNs) in learning node \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:PTA, author = "Chaochao Chen and Yizhao Zhang and Yuyuan Li and Jun Wang and Lianyong Qi and Xiaolong Xu and Xiaolin Zheng and Jianwei Yin", title = "Post-Training Attribute Unlearning in Recommender Systems", journal = j-TOIS, volume = "43", number = "1", pages = "25:1--25:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3701987", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3701987", abstract = "With the growing privacy concerns in recommender systems, recommendation unlearning is getting increasing attention. Existing studies predominantly use training data, i.e., model inputs, as unlearning target. However, attackers can extract private \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:VTG, author = "Shuo Zhang and Xiangwu Meng and Yujie Zhang", title = "Variational Type Graph Autoencoder for Denoising on Event Recommendation", journal = j-TOIS, volume = "43", number = "1", pages = "26:1--26:??", month = jan, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3703156", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 18 06:29:56 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3703156", abstract = "Recommendations for events play a pivotal role in facilitating the discovery of upcoming intriguing events within Event-Based Social Networks (EBSNs). Previous research has established the crucial significance of mining contextual features and implicit \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:PTMa, author = "Wenjie Wang and Zheng Liu and Fuli Feng and Zhicheng Dou and Qingyao Ai and Grace Hui Yang and Defu Lian and Lu Hou and Aixin Sun and Hamed Zamani and Donald Metzler and Maarten de Rijke", title = "Pre-Trained Models for Search and Recommendation: Introduction to the Special Issue --- {Part 1}", journal = j-TOIS, volume = "43", number = "2", pages = "27:1--27:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3709134", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3709134", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2025:HCR, author = "Jianghao Lin and Xinyi Dai and Yunjia Xi and Weiwen Liu and Bo Chen and Hao Zhang and Yong Liu and Chuhan Wu and Xiangyang Li and Chenxu Zhu and Huifeng Guo and Yong Yu and Ruiming Tang and Weinan Zhang", title = "How Can Recommender Systems Benefit from Large Language Models: a Survey", journal = j-TOIS, volume = "43", number = "2", pages = "28:1--28:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3678004", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3678004", abstract = "With the rapid development of online services and web applications, recommender systems (RS) have become increasingly indispensable for mitigating information overload and matching users' information needs by providing personalized suggestions over items. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:ADS, author = "Xin Wang and Hong Chen and Zirui Pan and Yuwei Zhou and Chaoyu Guan and Lifeng Sun and Wenwu Zhu", title = "Automated Disentangled Sequential Recommendation with Large Language Models", journal = j-TOIS, volume = "43", number = "2", pages = "29:1--29:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3675164", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3675164", abstract = "Sequential recommendation aims to recommend the next items that a target user may have interest in based on the user's sequence of past behaviors, which has become a hot research topic in both academia and industry. In the literature, sequential \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "29", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:MGM, author = "Hao Wang and Mingjia Yin and Luankang Zhang and Sirui Zhao and Enhong Chen", title = "{MF-GSLAE}: a Multi-Factor User Representation Pre-Training Framework for Dual-Target Cross-Domain Recommendation", journal = j-TOIS, volume = "43", number = "2", pages = "30:1--30:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3690382", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3690382", abstract = "Recently, the dual-target cross-domain recommendation has been an emerging research problem, which aims to improve the performances of both source and target domains by transferring the preferences of overlapping users. Most of the existing work adopted a \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "30", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Di:2025:FRS, author = "Yicheng Di and Hongjian Shi and Xiaoming Wang and Ruhui Ma and Yuan Liu", title = "Federated Recommender System Based on Diffusion Augmentation and Guided Denoising", journal = j-TOIS, volume = "43", number = "2", pages = "31:1--31:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3688570", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3688570", abstract = "Sequential recommender systems often struggle with accurate personalized recommendations due to data sparsity issues. Existing works use variational autoencoders and generative adversarial network methods to enrich sparse data. However, they often \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "31", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Peng:2025:DAL, author = "Yingtao Peng and Chen Gao and Yu Zhang and Tangpeng Dan and Xiaoyi Du and Hengliang Luo and Yong Li and Xiaofeng Meng", title = "Denoising Alignment with Large Language Model for Recommendation", journal = j-TOIS, volume = "43", number = "2", pages = "32:1--32:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3696662", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3696662", abstract = "The mainstream approach of GNN-based recommendation aggregates high-order ID information associated with the node in the user-item graph. The aggregation pattern using ID as signal has two disadvantages: lack of textual semantics and the impact of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "32", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:MLP, author = "Dan Zhang and Shaojie Zheng and Yifan Zhu and Huihui Yuan and Jibing Gong and Jie Tang", title = "{MCAP}: Low-Pass {GNNs} with Matrix Completion for Academic Recommendations", journal = j-TOIS, volume = "43", number = "2", pages = "33:1--33:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3698193", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3698193", abstract = "Graph neural networks (GNNs) are commonly used and have shown promising performance in recommendation systems. A major branch, heterogeneous GNNs, models heterogeneous information by leveraging side information for academic paper recommendations. These \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "33", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:GAE, author = "Lixiang Xu and Yusheng Liu and Tong Xu and Enhong Chen and Yuanyan Tang", title = "Graph Augmentation Empowered Contrastive Learning for Recommendation", journal = j-TOIS, volume = "43", number = "2", pages = "34:1--34:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3677377", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3677377", abstract = "The application of contrastive learning (CL) to collaborative filtering (CF) in recommender systems has achieved remarkable success. CL-based recommendation models mainly focus on creating multiple augmented views by employing different graph augmentation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "34", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2025:CCL, author = "Jiafeng Guo and Yinqiong Cai and Keping Bi and Yixing Fan and Wei Chen and Ruqing Zhang and Xueqi Cheng", title = "{CAME}: Competitively Learning a Mixture-of-Experts Model for First-stage Retrieval", journal = j-TOIS, volume = "43", number = "2", pages = "35:1--35:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3678880", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3678880", abstract = "The first-stage retrieval aims to retrieve a subset of candidate documents from a huge collection both effectively and efficiently. Since various matching patterns can exist between queries and relevant documents, previous work tries to combine multiple \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "35", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:SMS, author = "Xu Zhang and Zexu Lin and Xiaoyu Hu and Jianlei Wang and Wenpeng Lu and De-Yu Zhou", title = "{SECON}: Maintaining Semantic Consistency in Data Augmentation for Code Search", journal = j-TOIS, volume = "43", number = "2", pages = "36:1--36:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3686151", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3686151", abstract = "Efficient code search techniques are crucial in accelerating software development by aiding developers in locating specific code snippets and understanding code functionalities. This study investigates code search methodologies, focusing on the emerging \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "36", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ge:2025:LEC, author = "Hongfei Ge and Yuanchun Jiang and Jianshan Sun and Kun Yuan and Yezheng Liu", title = "{LLM}-Enhanced Composed Image Retrieval: an Intent Uncertainty-Aware Linguistic-Visual Dual Channel Matching Model", journal = j-TOIS, volume = "43", number = "2", pages = "37:1--37:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3699715", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3699715", abstract = "Composed image retrieval (CoIR) involves a multi-modal query of the reference image and modification text describing the desired changes, allowing users to express image retrieval intents flexibly and effectively. The key of CoIR lies in how to properly \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "37", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jafarzadeh:2025:KGE, author = "Parastoo Jafarzadeh and Faezeh Ensan and Mahdiyar Ali Akbar Alavi and Fattane Zarrinkalam", title = "A Knowledge Graph Embedding Model for Answering Factoid Entity Questions", journal = j-TOIS, volume = "43", number = "2", pages = "38:1--38:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3678003", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3678003", abstract = "Factoid entity questions (FEQ), which seek answers in the form of a single entity from knowledge sources, such as DBpedia and Wikidata, constitute a substantial portion of user queries in search engines. This article introduces the knowledge graph \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "38", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:BCA, author = "Xinze Li and Hanbin Wang and Zhenghao Liu and Shi Yu and Shuo Wang and Yukun Yan and Yukai Fu and Yu Gu and Ge Yu", title = "Building a Coding Assistant via the Retrieval-Augmented Language Model", journal = j-TOIS, volume = "43", number = "2", pages = "39:1--39:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3695868", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3695868", abstract = "Pretrained language models have shown strong effectiveness in code-related tasks, such as code retrieval, code generation, code summarization, and code completion tasks. In this article, we propose COde assistaNt viA retrieval-augmeNted language model \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "39", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mao:2025:FRB, author = "Yuren Mao and Xuemei Dong and Wenyi Xu and Yunjun Gao and Bin Wei and Ying Zhang", title = "{FIT-RAG}: Black-Box {RAG} with Factual Information and Token Reduction", journal = j-TOIS, volume = "43", number = "2", pages = "40:1--40:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3676957", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3676957", abstract = "Due to the extraordinarily large number of parameters, fine-tuning large language models (LLMs) to update long-tail or out-of-date knowledge is impractical in lots of applications. To avoid fine-tuning, we can alternatively treat a LLM as a black-box \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "40", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lyu:2025:CRC, author = "Yuanjie Lyu and Zhiyu Li and Simin Niu and Feiyu Xiong and Bo Tang and Wenjin Wang and Hao Wu and Huanyong Liu and Tong Xu and Enhong Chen", title = "{CRUD-RAG}: a Comprehensive {Chinese} Benchmark for Retrieval-Augmented Generation of Large Language Models", journal = j-TOIS, volume = "43", number = "2", pages = "41:1--41:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3701228", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3701228", abstract = "Retrieval-augmented generation (RAG) is a technique that enhances the capabilities of large language models (LLMs) by incorporating external knowledge sources. This method addresses common LLM limitations, including outdated information and the tendency \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "41", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2025:SHL, author = "Lei Huang and Weijiang Yu and Weitao Ma and Weihong Zhong and Zhangyin Feng and Haotian Wang and Qianglong Chen and Weihua Peng and Xiaocheng Feng and Bing Qin and Ting Liu", title = "A Survey on Hallucination in Large Language Models: Principles, Taxonomy, Challenges, and Open Questions", journal = j-TOIS, volume = "43", number = "2", pages = "42:1--42:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3703155", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3703155", abstract = "The emergence of large language models (LLMs) has marked a significant breakthrough in natural language processing (NLP), fueling a paradigm shift in information acquisition. Nevertheless, LLMs are prone to hallucination, generating plausible yet \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "42", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bevilacqua:2025:WAA, author = "Marialena Bevilacqua and Kezia Oketch and Ruiyang Qin and Will Stamey and Xinyuan Zhang and Yi Gan and Kai Yang and Ahmed Abbasi", title = "When Automated Assessment Meets Automated Content Generation: Examining Text Quality in the Era of {GPTs}", journal = j-TOIS, volume = "43", number = "2", pages = "43:1--43:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3702639", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3702639", abstract = "The use of machine learning (ML) models to assess and score textual data has become increasingly pervasive in an array of contexts including natural language processing, information retrieval, search and recommendation, and credibility assessment of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "43", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:UBR, author = "Fan Liu and Yaqi Liu and Huilin Chen and Zhiyong Cheng and Liqiang Nie and Mohan Kankanhalli", title = "Understanding Before Recommendation: Semantic Aspect-Aware Review Exploitation via Large Language Models", journal = j-TOIS, volume = "43", number = "2", pages = "44:1--44:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3704999", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3704999", abstract = "Recommendation systems harness user-item interactions like clicks and reviews to learn their representations. Previous studies improve recommendation accuracy and interpretability by modeling user preferences across various aspects and intents. However, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "44", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cunha:2025:NOR, author = "Washington Cunha and Alejandro Moreo Fern{\'a}ndez and Andrea Esuli and Fabrizio Sebastiani and Leonardo Rocha and Marcos Andr{\'e} Gon{\c{c}}alves", title = "A Noise-Oriented and Redundancy-Aware Instance Selection Framework", journal = j-TOIS, volume = "43", number = "2", pages = "45:1--45:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3705000", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3705000", abstract = "Fine-tuning transformer-based deep-learning models are currently at the forefront of natural language processing (NLP) and information retrieval (IR) tasks. However, fine-tuning these transformers for specific tasks, especially when dealing with ever-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "45", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sun:2025:MAL, author = "Ying Sun and Yang Ji and Hengshu Zhu and Fuzhen Zhuang and Qing He and Hui Xiong", title = "Market-aware Long-term Job Skill Recommendation with Explainable Deep Reinforcement Learning", journal = j-TOIS, volume = "43", number = "2", pages = "46:1--46:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3704998", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3704998", abstract = "Continuously learning new skills is essential for talents to gain a competitive advantage in the labor market. Despite extensive efforts on relevance- or preference-based skill recommendations, little attention has been given to the practical effects of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "46", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:ACM, author = "Leping Zhang and Xiao Zhang and Yichao Wang and Xuan Li and Zhenhua Dong and Jun Xu", title = "Adapting Constrained {Markov} Decision Process for {OCPC} Bidding with Delayed Conversions", journal = j-TOIS, volume = "43", number = "2", pages = "47:1--47:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3706420", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3706420", abstract = "Nowadays, optimized cost-per-click (OCPC) has been widely adopted in online advertising. In OCPC, the advertiser sets an expected cost-per-conversion and pays per click, while the platform automatically adjusts the bid on each click to meet advertiser's \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "47", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huynh:2025:CUF, author = "Thanh Trung Huynh and Trong Bang Nguyen and Thanh Toan Nguyen and Phi Le Nguyen and Hongzhi Yin and Quoc Viet Hung Nguyen and Thanh Tam Nguyen", title = "Certified Unlearning for Federated Recommendation", journal = j-TOIS, volume = "43", number = "2", pages = "48:1--48:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3706419", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3706419", abstract = "Recommendation systems play a crucial role in providing web-based suggestion utilities by leveraging user behavior, preferences, and interests. In the context of privacy concerns and the proliferation of handheld devices, federated recommender systems \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "48", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dang:2025:EAR, author = "Yizhou Dang and Yuting Liu and Enneng Yang and Guibing Guo and Linying Jiang and Jianzhe Zhao and Xingwei Wang", title = "Efficient and Adaptive Recommendation Unlearning: a Guided Filtering Framework to Erase Outdated Preferences", journal = j-TOIS, volume = "43", number = "2", pages = "49:1--49:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3706633", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3706633", abstract = "Recommendation unlearning is an emerging task to erase the influences of user-specified data from a trained recommendation model. Most existing research follows the paradigm of partitioning the original dataset into multi-fold and then retraining \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "49", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:PPS, author = "Wei Wang and Yujie Lin and Pengjie Ren and Zhumin Chen and Tsunenori Mine and Jianli Zhao and Qiang Zhao and Moyan Zhang and Xianye Ben and Yujun Li", title = "Privacy-Preserving Sequential Recommendation with Collaborative Confusion", journal = j-TOIS, volume = "43", number = "2", pages = "50:1--50:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3707204", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3707204", abstract = "Sequential recommendation has attracted a lot of attention from both academia and industry, however the privacy risks associated with gathering and transferring users' personal interaction data are often underestimated or ignored. Existing privacy-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "50", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:SDA, author = "Qin Zhang and Mengqi Zheng and Shangsi Chen and Han Liu and Meng Fang", title = "Self Data Augmentation for Open Domain Question Answering", journal = j-TOIS, volume = "43", number = "2", pages = "51:1--51:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3707449", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3707449", abstract = "Information Retrieval (IR) constitutes a vital facet of Open Domain Question Answering (ODQA) systems, focusing on the exploration of pertinent information within extensive collections of passages, such as Wikipedia, to facilitate subsequent reader \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "51", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yuan:2025:PFP, author = "Wei Yuan and Chaoqun Yang and Liang Qu and Quoc Viet Hung Nguyen and Guanhua Ye and Hongzhi Yin", title = "{PTF-FSR}: a Parameter Transmission-Free Federated Sequential Recommender System", journal = j-TOIS, volume = "43", number = "2", pages = "52:1--52:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3708344", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3708344", abstract = "Sequential recommender systems, as a specialized branch of recommender systems that can capture users' dynamic preferences for more accurate and timely recommendations, have made significant progress. Recently, due to increasing concerns about user data \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "52", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:DES, author = "Nuo Chen and Jiqun Liu and Hanpei Fang and Yuankai Luo and Tetsuya Sakai and Xiao-Ming Wu", title = "Decoy Effect in Search Interaction: Understanding User Behavior and Measuring System Vulnerability", journal = j-TOIS, volume = "43", number = "2", pages = "53:1--53:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3708884", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3708884", abstract = "This study addresses (1) the influence of the decoy effect, a cognitive bias where the presence of an inferior item alters preferences between two options, on users' search interactions and (2) the measurement of information retrieval systems' \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "53", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qu:2025:TMM, author = "Zekai Qu and Ruobing Xie and Chaojun Xiao and Yuan Yao and Zhiyuan Liu and Fengzong Lian and Zhanhui Kang and Jie Zhou", title = "Thoroughly Modeling Multi-domain Pre-trained Recommendation as Language", journal = j-TOIS, volume = "43", number = "2", pages = "54:1--54:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3708883", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3708883", abstract = "With the thriving of the pre-trained language model (PLM) widely verified in various NLP tasks, pioneer efforts attempt to explore the possible cooperation of the general textual information in PLM with the personalized behavioral information in user \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "54", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:UBS, author = "Lei Wang and Jingsen Zhang and Hao Yang and Zhi-Yuan Chen and Jiakai Tang and Zeyu Zhang and Xu Chen and Yankai Lin and Hao Sun and Ruihua Song and Xin Zhao and Jun Xu and Zhicheng Dou and Jun Wang and Ji-Rong Wen", title = "User Behavior Simulation with Large Language Model-based Agents", journal = j-TOIS, volume = "43", number = "2", pages = "55:1--55:??", month = mar, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3708985", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Feb 21 09:19:58 MST 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", URL = "https://dl.acm.org/doi/10.1145/3708985", abstract = "Simulating high quality user behavior data has always been a fundamental yet challenging problem in human-centered applications such as recommendation systems, social networks, among many others. The major difficulty of user behavior simulation originates \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "55", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yom-Tov:2025:SEO, author = "Elad Yom-Tov and Liat Levontin", title = "The In-Situ Effect of Offensive Ads on Search Engine Users", journal = j-TOIS, volume = "43", number = "3", pages = "56:1--56:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3704438", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Unscrupulous advertisers may try to increase attention to search ads by using offensive ads, which can increase attention and recall to the detriment of individuals and society. Here, we investigate whether offensive ads, when shown to search engine users, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "56", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:CPM, author = "Qidong Liu and Zhaopeng Qiu and Xiangyu Zhao and Xian Wu and Zijian Zhang and Tong Xu and Feng Tian", title = "A Contrastive Pretrain Model with Prompt Tuning for Multi-center Medication Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "57:1--57:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3706631", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Medication recommendation is one of the most critical health-related applications, which has attracted extensive research interest recently. Most existing works focus on a single hospital with abundant medical data. However, many small hospitals only have \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "57", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yu:2025:DCD, author = "Yi Yu and Kazunari Sugiyama and Adam Jatowt", title = "Domain Counterfactual Data Augmentation for Explainable Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "58:1--58:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3711856", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Providing explanations for recommendation decisions is crucial for enhancing user trust and satisfaction in recommender systems. However, existing generative methods often produce generic, repetitive explanation texts that fail to reflect the true reasons \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "58", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hu:2025:EER, author = "Linmei Hu and Xinyu Zhang and Dandan Song and Changzhi Zhou and Hongyu He and Liqiang Nie", title = "Efficient and Effective Role Player: a Compact Knowledge-grounded Persona-based Dialogue Model Enhanced by {LLM} Distillation", journal = j-TOIS, volume = "43", number = "3", pages = "59:1--59:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3711857", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Incorporating explicit personas into dialogue models is critical for generating responses that fulfill specific user needs and preferences, creating a more personalized and engaging interaction. Early works on persona-based dialogue generation directly \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "59", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yu:2025:MMV, author = "Li Yu and Jianyong Hu and Qihan Du and Xi Niu", title = "{MVideoRec}: Micro Video Recommendations through Modality Decomposition and Contrastive Learning", journal = j-TOIS, volume = "43", number = "3", pages = "60:1--60:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3711855", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Personalized micro video recommendation aims to recommend the micro videos tailored to user preference based on the user's interaction history with the micro videos, which has drawn increasing attention from both the academic and industrial communities. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "60", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:CTC, author = "Zirui Liu and Hailin Zhang and Boxuan Chen and Zihan Jiang and Yikai Zhao and Yangyu Tao and Tong Yang and Bin Cui", title = "{CAFE+}: Towards Compact, Adaptive, and Fast Embedding for Large-scale Online Recommendation Models", journal = j-TOIS, volume = "43", number = "3", pages = "61:1--61:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3713072", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The growing memory demands of embedding tables in Deep Learning Recommendation Models (DLRMs) pose great challenges for model training and deployment. Existing embedding compression solutions cannot simultaneously achieve memory efficiency, low latency, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "61", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:ANI, author = "Yuanxing Liu and Jiahuan Pei and Wei-Nan Zhang and Ming Li and Wanxiang Che and Maarten de Rijke", title = "Augmentation with Neighboring Information for Conversational Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "62:1--62:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3712588", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Conversational recommender systems (CRSs) suggest items to users by understanding their needs and preferences from natural language conversations. While users can freely express preferences, modeling needs and preferences solely from users' conversations \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "62", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tran:2025:TPB, author = "Hung Vinh Tran and Tong Chen and Nguyen {Quoc Viet Hung} and Zi Huang and Lizhen Cui and Hongzhi Yin", title = "A Thorough Performance Benchmarking on Lightweight Embedding-based Recommender Systems", journal = j-TOIS, volume = "43", number = "3", pages = "63:1--63:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3712589", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Since the creation of the Web, recommender systems (RSs) have been an indispensable personalization mechanism in information filtering. Most state-of-the-art RSs primarily depend on categorical features such as user and item IDs, and use embedding vectors \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "63", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:KDK, author = "Haonan Zhang and Dongxia Wang and Zhu Sun and Yanhui Li and Youcheng Sun and Huizhi Liang and Wenhai Wang", title = "{KG4RecEval}: Does Knowledge Graph Really Matter for Recommender Systems?", journal = j-TOIS, volume = "43", number = "3", pages = "64:1--64:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3713071", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommender systems (RSs) are designed to provide personalized recommendations to users. Recently, knowledge graphs (KGs) have been widely introduced in RSs to improve recommendation accuracy. In this study, however, we demonstrate that RSs do not \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "64", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:SAC, author = "Bulou Liu and Yiran Hu and Qingyao Ai and Yueyue Wu and Yiqun Liu and Chenliang Li and Fan Zhang and Weixing Shen and Chong Chen and Qi Tian", title = "Structure-Aware Conversational Legal Case Retrieval", journal = j-TOIS, volume = "43", number = "3", pages = "65:1--65:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3711854", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Legal case retrieval is an important task in information retrieval that aims to retrieve relevant cases for given query cases. Conversational search paradigms have been shown to improve the search experience in legal case retrieval. However, there are two \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "65", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:GEP, author = "Zihan Wang and Hanbing Wang and Pengjie Ren and Zhumin Chen and Maarten de Rijke and Zhaochun Ren", title = "Graph-Enhanced Prompt Learning for Cross-Domain Contract Element Extraction", journal = j-TOIS, volume = "43", number = "3", pages = "66:1--66:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715100", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Cross-domain contract element extraction (CEE) aims to transfer knowledge from a source domain to facilitate the extraction of legally relevant elements (e.g., contract dates or payments) from contracts in a target domain. To achieve this goal, recent \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "66", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2025:PCA, author = "Yang Deng and Lizi Liao and Wenqiang Lei and Grace Hui Yang and Wai Lam and Tat-Seng Chua", title = "Proactive Conversational {AI}: a Comprehensive Survey of Advancements and Opportunities", journal = j-TOIS, volume = "43", number = "3", pages = "67:1--67:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715097", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Dialogue systems are designed to offer human users social support or functional services through natural language interactions. Traditional conversation research has put significant emphasis on a system's response-ability, including its capacity to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "67", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:EHH, author = "Hao Wang and Bin Guo and Yating Zeng and Mengqi Chen and Yasan Ding and Ying Zhang and Lina Yao and Zhiwen Yu", title = "Enabling Harmonious Human-Machine Interaction with Visual-Context Augmented Dialogue System: a Review", journal = j-TOIS, volume = "43", number = "3", pages = "68:1--68:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715098", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The intelligent dialogue system, aiming at communicating with humans harmoniously with natural language, is brilliant for promoting the advancement of human-machine interaction in the era of artificial intelligence. With the gradually complex human-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "68", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2025:OVF, author = "Enyue Yang and Weike Pan and Lixin Fan and Hanlin Gu and Zhitao Li and Qiang Yang and Zhong Ming", title = "Ownership Verification for Federated Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "69:1--69:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715320", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Most federated learning-based recommender systems allow clients to access a well-trained high-quality model locally, which provides adversaries with the opportunity to infringe the legitimate copyright of the model. In response, we study an emerging and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "69", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2025:CMD, author = "Xixun Lin and Rui Liu and Yanan Cao and Lixin Zou and Qian Li and Yongxuan Wu and Yang Liu and Dawei Yin and Guandong Xu", title = "Contrastive Modality-Disentangled Learning for Multimodal Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "70:1--70:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715876", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Multimodal recommendation, which utilizes rich multimodal information to learn user preferences, has attracted significant attention. Most works focus on designing powerful encoders for extracting multimodal features, and simply aggregate the learned \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "70", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:UPA, author = "Haobo Zhang and Qiannan Zhu and Zhicheng Dou", title = "A Unified Prompt-aware Framework for Personalized Search and Explanation Generation", journal = j-TOIS, volume = "43", number = "3", pages = "71:1--71:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3716131", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Product search is crucial for users to find and purchase products they need. Personalized product search, which models users' search intent and provides tailored results, has become a prominent research problem in industry and academia. Recent studies \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "71", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mao:2025:RPP, author = "Wenyu Mao and Jiancan Wu and Weijian Chen and Chongming Gao and Xiang Wang and Xiangnan He", title = "Reinforced Prompt Personalization for Recommendation with Large Language Models", journal = j-TOIS, volume = "43", number = "3", pages = "72:1--72:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3716320", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Designing effective prompts can empower LLMs to understand user preferences and provide recommendations with intent comprehension and knowledge utilization capabilities. Nevertheless, recent studies predominantly concentrate on task-wise prompting, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "72", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:AGE, author = "Zunlong Liu and Yang Xu and Gao Cong and Lei Zhu and Qinjun Qiu and Huaxiang Zhang", title = "{ARTS}: a General and Efficient Multi-Task Self-Prompt Framework for Explainable Sequential Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "73:1--73:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3717833", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Providing sequential recommendations along with easily comprehensible natural language explanations can significantly enhance users' trust in the recommender systems. However, this approach presents two key challenges: (1) The different objectives of the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "73", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:REU, author = "Junjie Zhang and Wenqi Sun and Yupeng Hou and Xin Zhao and Ji-Rong Wen", title = "Review-Enhanced Universal Sequence Representation Learning for Recommender Systems", journal = j-TOIS, volume = "43", number = "3", pages = "74:1--74:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3717832", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the widespread deployment of recommender systems on various online platforms, researchers are striving to develop transferable recommendation algorithms that can effectively adapt to new task scenarios without requiring the re-training of new \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "74", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Cui:2025:RDR, author = "Jiajun Cui and Hong Qian and Chanjin Zheng and Lu Wang and Mo Yu and Wei Zhang", title = "Rebalancing Discriminative Responses for Knowledge Tracing", journal = j-TOIS, volume = "43", number = "3", pages = "75:1--75:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3716821", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Knowledge Tracing (KT) is a crucial task in computer-aided education and intelligent tutoring systems, predicting students' performance on new questions from their responses to prior ones. An accurate KT model can capture a student's mastery level of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "75", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:ISD, author = "Dongyang Li and Jianshan Sun and Chongming Gao and Fuli Feng and Kun Yuan", title = "Independent or Social Driven Decision? A Counterfactual Refinement Strategy for Graph-Based Social Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "76:1--76:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3717830", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Social recommendation models have traditionally relied on social homophily to enhance user preference prediction by incorporating information from socially connected friends. However, this approach neglects the diverse nature of social relationships. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "76", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:MMR, author = "Chengde Zhang and Zihan Zhang and Jiaying Huang and Yan Liu and Dawei Jin and Xia Xiao and Zuwu Shen", title = "{MKCRec}: Meta-relation guided Knowledge Coupling for Paper Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "77:1--77:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715101", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the surge of academic papers, it has become a common practice to recommend papers based on authors' research interests. Existing methods focus on leveraging author-paper research interactions to mine authors' research interests with coauthorship \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "77", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:VPP, author = "Gangyi Zhang and Chongming Gao and Wenqiang Lei and Xiaojie Guo and Shijun Li and Hongshen Chen and Zhuozhi Ding and Sulong Xu and Lingfei Wu", title = "Vague Preference Policy Learning for Conversational Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "78:1--78:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3717831", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Conversational Recommendation Systems (CRS) effectively address information asymmetry by dynamically eliciting user preferences through multi-turn interactions. However, existing CRS methods commonly assume that users have clear, definite preferences for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "78", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:LYE, author = "Jinyu Zhang and Chao Li and Zhongying Zhao", title = "Lightweight yet Efficient: an External Attentive Graph Convolutional Network with Positional Prompts for Sequential Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "79:1--79:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3719343", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Graph-Based Sequential Recommender Systems (GSRSs) have gained significant research attention due to their ability to simultaneously handle user-item interactions and sequential relationships between items. Current GSRSs often utilize composite or in-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "79", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2025:SGC, author = "Chu Zhao and Enneng Yang and Yuliang Liang and Jianzhe Zhao and Guibing Guo and Xingwei Wang", title = "Symmetric Graph Contrastive Learning against Noisy Views for Recommendation", journal = j-TOIS, volume = "43", number = "3", pages = "80:1--80:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3722103", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Graph Contrastive Learning (GCL) leverages data augmentation techniques to produce contrasting views, enhancing the accuracy of recommendation systems through learning the consistency between contrastive views. However, existing augmentation methods, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "80", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bron:2025:UCE, author = "Michiel Bron and Peter G. M. van der Heijden and Ad Feelders and Arno Siebes", title = "Using {Chao}'s Estimator as a Stopping Criterion for Technology-Assisted Review", journal = j-TOIS, volume = "43", number = "3", pages = "81:1--81:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3724116", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Technology-Assisted Review aims to reduce the human effort required for screening processes such as abstract screening for Systematic Literature Reviews. Human reviewers label documents as relevant or irrelevant during this process, while the system \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "81", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Su:2025:IEF, author = "Yixin Su and Wei Jiang and Fangquan Lin and Cheng Yang and Sarah M. Erfani and Junhao Gan and Yunxiang Zhao and Ruixuan Li and Rui Zhang", title = "Intrinsic and Extrinsic Factor Disentanglement for Recommendation in Various Context Scenarios", journal = j-TOIS, volume = "43", number = "3", pages = "82:1--82:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3722553", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In recommender systems, the patterns of user behaviors (e.g., purchase, click) may vary greatly in different contexts (e.g., time and location). This is because user behavior is jointly determined by two types of factors: intrinsic factors, which reflect \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "82", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:MGS, author = "Xiaoxi Li and Jiajie Jin and Yujia Zhou and Yuyao Zhang and Peitian Zhang and Yutao Zhu and Zhicheng Dou", title = "From Matching to Generation: a Survey on Generative Information Retrieval", journal = j-TOIS, volume = "43", number = "3", pages = "83:1--83:??", month = may, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3722552", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Tue May 20 07:06:58 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information Retrieval (IR) systems are crucial tools for users to access information, which have long been dominated by traditional methods relying on similarity matching. With the advancement of pre-trained language models, Generative Information \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "83", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:ESP, author = "Jiongnan Liu and Zhicheng Dou and Jian-Yun Nie and Zhenlin Chen and Guoyu Tang and Sulong Xu and Ji-Rong Wen", title = "Enhancing Sequential Personalized Product Search with External Out-of-sequence Knowledge", journal = j-TOIS, volume = "43", number = "4", pages = "84:1--84:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3726864", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "A key challenge in personalized product search is to capture user's preferences. Recent work attempted to model sequences of user historical behaviors, i.e., product purchase histories, to build user profiles and to personalize results accordingly. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "84", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:HVJ, author = "Nuo Xu and Pinghui Wang and Zi Liang and Junzhou Zhao and Xiaohong Guan", title = "How Vital Is the Jurisprudential Relevance: Law Article-Intervened Legal Case Retrieval and Matching", journal = j-TOIS, volume = "43", number = "4", pages = "85:1--85:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3725729", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Legal case retrieval aims to automatically scour comparable legal cases based on a given query, which is crucial for offering relevant precedents to support the judgment in intelligent legal systems. Due to similar goals, it is often associated with a \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "85", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:LHF, author = "Huili Wang and Chuhan Wu and Yongfeng Huang and Tao Qi", title = "Learning Human Feedback from Large Language Models for Content Quality-aware Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "86:1--86:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3727144", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommender systems are widely employed to mitigate information overload by tailoring online content to individual preferences. Existing recommendation methods typically focus on optimizing the relevance between candidate item content and user historical \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "86", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ruan:2025:CCP, author = "Shulan Ruan and Huijie Liu and Zhao Chen and Bin Feng and Kun Zhang and Caleb Chen Cao and Enhong Chen and Lei Chen", title = "{CPWS}: Confident Programmatic Weak Supervision for High-Quality Data Labeling", journal = j-TOIS, volume = "43", number = "4", pages = "87:1--87:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3725730", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Programmatic Weak Supervision (PWS) is a recent data labeling paradigm, which employs several Labeling Functions (LFs) to provide weak labels and involves a Label Model (LM) for label aggregation. Despite the significant progress, there still remain some \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "87", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hu:2025:HTM, author = "Shirui Hu and Weichang Wu and Zuoli Tang and Zhaoxin Huan and Lin Wang and Xiaolu Zhang and Jun Zhou and Lixin Zou and Chenliang Li", title = "{HORAE}: Temporal Multi-Interest Pre-training for Sequential Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "88:1--88:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3727645", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The data sparsity problem has been a long-standing obstacle towards achieving better recommendation performance since it is miserable to estimate the user's interests from limited historical behaviors. The pre-training paradigm, i.e., learning universal \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "88", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:EEE, author = "Jinguang Wang and Shengsheng Qian and Jun Hu and Wenxiang Dong and Xudong Huang and Richang Hong", title = "End-to-End Explainable Fake News Detection Via Evidence-Claim Variational Causal Inference", journal = j-TOIS, volume = "43", number = "4", pages = "89:1--89:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3728462", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Explainable Fake News Detection (EFND) is a new challenge that aims to verify news authenticity and provide clear explanations for its decisions. Traditional EFND methods often treat the tasks of classification and explanation as separate, ignoring the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "89", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:HGN, author = "Shuliang Wang and Jiabao Zhu and Yi Wang and Chen Ma and Xin Zhao and Yansen Zhang and Ziqiang Yuan and Sijie Ruan", title = "Hierarchical Gating Network for Cross-Domain Sequential Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "90:1--90:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715321", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Cross-domain sequential recommendation (CDSR) utilizes data from multiple domains to recommend the user's next interaction based on his latest interaction sequence. Currently, many cross-domain sequential recommendation algorithms have been proven to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "90", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qiao:2025:MVI, author = "Shutong Qiao and Wei Zhou and Junhao Wen and Chen Gao and Qun Luo and Peixuan Chen and Yong Li", title = "Multi-view Intent Learning and Alignment with Large Language Models for Session-based Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "91:1--91:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3719344", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Session-based recommendation (SBR) methods often rely on user behavior data, which can struggle with the sparsity of session data, limiting performance. Researchers have identified that beyond behavioral signals, rich semantic information in item \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "91", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sritrakool:2025:QDL, author = "Nakarin Sritrakool and Saranya Maneeroj and Atsuhiro Takasu", title = "{QUADEN}: Discovering Latent Neighbors for Sparse Users and Items across Interaction Quadrants in Recommender System", journal = j-TOIS, volume = "43", number = "4", pages = "92:1--92:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3725886", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Many recommender systems leverage Graph Neural Networks to capture user-item relations for delivering recommendations. However, the representation of nodes heavily relies on neighbors, causing limited neighbor nodes (sparse nodes) to lack expressive \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "92", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jian:2025:GAS, author = "Meng Jian and Tuo Wang and Zhuoyang Xia and Ge Shi and Richang Hong and Lifang Wu", title = "Geometric-Augmented Self-Distillation for Graph-Based Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "93:1--93:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3729223", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The prevalent recommendation techniques explore the graph structure of interactions to alleviate the interaction sparsity issue for inferring users' interests. These graph models focus on extracting local structural signals to model users' interests, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "93", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qin:2025:PTO, author = "Yifang Qin and Wei Ju and Yiyang Gu and Ziyue Qiao and Zhiping Xiao and Ming Zhang", title = "{PolyCF}: Towards Optimal Spectral Graph Filters for Collaborative Filtering", journal = j-TOIS, volume = "43", number = "4", pages = "94:1--94:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3728464", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Collaborative Filtering (CF) is a pivotal research area in recommender systems that capitalizes on collaborative similarities between users and items to provide personalized recommendations. With the remarkable achievements of node embedding-based Graph \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "94", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yuan:2025:HCH, author = "Meng Yuan and Zhao Zhang and Wei Chen and Chu Zhao and Tong Cai and Deqing Wang and Rui Liu and Fuzhen Zhuang", title = "{HEK-CL}: Hierarchical Enhanced Knowledge-Aware Contrastive Learning for Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "95:1--95:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3728463", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, there has been an emergence of self-supervised recommendation methods that integrate knowledge graphs. Upon conducting a comprehensive review of contrastive learning (CL) in recommender systems, we conclude that existing methods solely focus on \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "95", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2025:RAA, author = "Xu Huang and Jianxun Lian and Yuxuan Lei and Jing Yao and Defu Lian and Xing Xie", title = "Recommender {AI} Agent: Integrating Large Language Models for Interactive Recommendations", journal = j-TOIS, volume = "43", number = "4", pages = "96:1--96:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3731446", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommender models capture ever-changing user preferences by training with in-domain user behavior data. These models are typically lightweight, facilitating real-time and large-scale online services. However, these models often falter when tasked with \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "96", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Adalia:2025:LFP, author = "Ramon Ad{\`a}lia and Gemma Sanjuan and Tom{\`a}s Margalef and Ismael Zamora", title = "The {LambdaGap} Framework for Precision-Oriented Ranking", journal = j-TOIS, volume = "43", number = "4", pages = "97:1--97:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733235", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "LambdaRank has proven effective for optimizing information retrieval metrics such as Normalized Discounted Cumulative Gain (NDCG). However, its application to Precision at document k (P@ k ) poses significant challenges because of the metric's unique \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "97", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chu:2025:PDA, author = "Yuxing Chu and Mingxu Sun and Ke Huang and Haokun Geng and Yanyu Zhang and Lili Zhang and Menghua Zhang", title = "Personality Dialogue Agent Based on Personality Description and Conversation History", journal = j-TOIS, volume = "43", number = "4", pages = "98:1--98:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3731679", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In the study of dialogue system, personalized dialogue mainly focuses on the semantic matching degree between response and role. However, various factors, such as semantic style, dialogue noise, and sparse personality information, can affect the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "98", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:PLR, author = "Fei Li and Enneng Yang and Guibing Guo and Linying Jiang and Jianzhe Zhao and Xingwei Wang", title = "Preference Logical Reasoning with Preference Operators for Explainable Recommendations", journal = j-TOIS, volume = "43", number = "4", pages = "99:1--99:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733596", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Preference logical reasoning utilizes user-item interactions (e.g., ratings and reviews) to infer user preferences and discover user decision paths from the knowledge graph to enhance the explainability of item recommendations. However, existing \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "99", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:NPE, author = "Tairan Wang and Xiuying Chen and Qingqing Zhu and Taicheng Guo and Shen Gao and Zhiyong Lu and Xin Gao and Xiangliang Zhang", title = "New Paradigm for Evaluating Scholar Summaries: a Facet-aware Metric and a Meta-evaluation Benchmark", journal = j-TOIS, volume = "43", number = "4", pages = "100:1--100:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733597", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Evaluation of summary quality is particularly crucial within the scientific domain, because it facilitates efficient knowledge dissemination and automated scientific information retrieval. This article presents conceptual and experimental analyses of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "100", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yu:2025:UGP, author = "Qing Yu and Lixin Zou and Xiangyang Luo and Xiangyu Zhao and Chenliang Li", title = "Uniform Graph Pre-training and Prompting for Transferable Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "101:1--101:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3724392", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, the paradigm of pre-training and fine-tuning has achieved impressive performance owing to their ability to transfer general knowledge from pre-trained domain to target domain. Meanwhile, graph neural networks (GNNs) have gained prominence in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "101", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2025:GCQ, author = "Bulou Liu and Yiran Hu and Qingyao Ai and Yiqun Liu and Yueyue Wu and Chenliang Li and Weixing Shen", title = "Generating Clarifying Questions for Conversational Legal Case Retrieval without External Knowledge", journal = j-TOIS, volume = "43", number = "4", pages = "102:1--102:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736161", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In legal case retrieval, existing work has shown that human-mediated conversational search can improve users' search experience. One of the key problems for a practical conversational search system is how to ask high-quality clarifying questions to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "102", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lu:2025:FSL, author = "Ziang Lu and Lei Guo and Xu Yu and Zhiyong Cheng and Xiaohui Han and Lei Zhu", title = "Federated Semantic Learning for Privacy-preserving Cross-domain Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "103:1--103:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3728359", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In the evolving landscape of recommender systems, the challenge of effectively conducting privacy-preserving Cross-domain Recommendation, especially under strict non-overlapping constraints, has emerged as a key focus. Despite extensive research has made \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "103", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Bai:2025:EMT, author = "Ting Bai and Le Huang and Yue Yu and Cheng Yang and Cheng Hou and Zhe Zhao and Chuan Shi", title = "Efficient Multi-task Prompt Tuning for Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "104:1--104:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736403", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "With the expansion of business scenarios, real recommender systems are facing challenges in dealing with the constantly emerging new tasks in multi-task learning frameworks. In this article, we attempt to improve the generalization ability of multi-task \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "104", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lucchese:2025:EEE, author = "Claudio Lucchese and Franco Maria Nardini and Salvatore Orlando and Raffaele Perego and Alberto Veneri", title = "Explainable, Effective, and Efficient Learning-to-Rank Models Using {ILMART}", journal = j-TOIS, volume = "43", number = "4", pages = "105:1--105:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733232", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Learning ranking models that are both explainable and effective is an emerging topic within the research area of explainable AI. Several Learning-to-Rank (LtR) algorithms have been recently proposed that build models that are simple to explain and, at \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "105", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Meng:2025:QPP, author = "Chuan Meng and Negar Arabzadeh and Arian Askari and Mohammad Aliannejadi and Maarten de Rijke", title = "Query Performance Prediction Using Relevance Judgments Generated by Large Language Models", journal = j-TOIS, volume = "43", number = "4", pages = "106:1--106:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736402", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Query performance prediction (QPP) aims to estimate the retrieval quality of a search system for a query without human relevance judgments. Previous QPP methods typically return a single scalar value and do not require the predicted values to approximate \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "106", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2025:BSP, author = "Chuang Zhao and Hui Tang and Hongke Zhao and Xiaomeng Li", title = "Beyond Sequential Patterns: Rethinking Healthcare Predictions with Contextual Insights", journal = j-TOIS, volume = "43", number = "4", pages = "107:1--107:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733234", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Healthcare predictions, such as readmission prediction, stand as a cornerstone of societal well-being, exerting a profound influence on individual health outcomes and communal vitality. Existing research primarily employs advanced graph neural networks \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "107", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liang:2025:LEG, author = "Xurong Liang and Tong Chen and Wei Yuan and Hogzhi Yin", title = "Lightweight Embeddings with Graph Rewiring for Collaborative Filtering", journal = j-TOIS, volume = "43", number = "4", pages = "108:1--108:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3742424", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "See erratum \cite{Liang:2026:ELE}.", abstract = "GNN-based recommender systems have become increasingly popular in academia and industry due to their ability to capture high-order information from user-item interaction graphs. However, as recommendation services scale rapidly and their deployment now \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "108", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xiang:2025:CGP, author = "Zongyi Xiang and Yan Zhang and Lixin Duan and Hongzhi Yin and Ivor W. Tsang", title = "Coherence-guided Preference Disentanglement for Cross-domain Recommendations", journal = j-TOIS, volume = "43", number = "4", pages = "109:1--109:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3742855", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Discovering user preferences across different domains is pivotal in cross-domain recommendation systems, particularly when platforms lack comprehensive user-item interactive data. The limited presence of shared users often hampers the effective modeling \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "109", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yan:2025:UIP, author = "Mingshi Yan and Zhiyong Cheng and Fan Liu and Yingda Lyu and Yahong Han", title = "User Invariant Preference Learning for Multi-Behavior Recommendation", journal = j-TOIS, volume = "43", number = "4", pages = "110:1--110:??", month = jul, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3728465", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jul 26 09:14:44 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In multi-behavior recommendation scenarios, analyzing users' diverse behaviors, such as click, purchase, and rating, enables a more comprehensive understanding of their interests, facilitating personalized and accurate recommendations. A fundamental \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "110", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:PTMb, author = "Wenjie Wang and Zheng Liu and Fuli Feng and Zhicheng Dou and Qingyao Ai and Grace Hui Yang and Defu Lian and Lu Hou and Aixin Sun and Hamed Zamani and Donald Metzler and Maarten de Rijke", title = "Pre-Trained Models for Search and Recommendation: Introduction to the Special Issue --- {Part 2}", journal = j-TOIS, volume = "43", number = "5", pages = "111:1--111:5", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736540", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "111", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:EIB, author = "Lei Chen and Chen Gao and Xiaoyi Du and Hengliang Luo and Depeng Jin and Yong Li and Meng Wang", title = "Enhancing {ID}-based Recommendation with Large Language Models", journal = j-TOIS, volume = "43", number = "5", pages = "112:1--112:30", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3704263", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Large language models (LLMs) have recently garnered significant attention in various domains, including recommendation systems. Recent research leverages the capabilities of LLMs to improve the performance and user modeling aspects of recommender systems. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "112", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Luo:2025:RIT, author = "Sichun Luo and Bowei He and Haohan Zhao and Wei Shao and Yanlin Qi and Yinya Huang and Aojun Zhou and Yuxuan Yao and Zongpeng Li and Yuanzhang Xiao and Mingjie Zhan and Linqi Song", title = "{RecRanker}: Instruction Tuning Large Language Model as Ranker for Top-$k$ Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "113:1--113:31", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3705728", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Large language models (LLMs) have demonstrated remarkable capabilities and have been extensively deployed across various domains, including recommender systems. Prior research has employed specialized prompts to leverage the in-context learning \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "113", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:RIF, author = "Junjie Zhang and Ruobing Xie and Yupeng Hou and Xin Zhao and Leyu Lin and Ji-Rong Wen", title = "Recommendation as Instruction Following: a Large Language Model Empowered Recommendation Approach", journal = j-TOIS, volume = "43", number = "5", pages = "114:1--114:37", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3708882", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In the past few decades, recommender systems have attracted much attention in both research and industry communities. Existing recommendation models mainly learn the underlying user preference from historical behavior data (typically in the forms of item \ldots{})", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "114", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dong:2025:CTP, author = "Zhiang Dong and Liya Hu and Jingyuan Chen and Zhihua Wang and Fei Wu", title = "Comprehend Then Predict: Prompting Large Language Models for Recommendation with Semantic and Collaborative Data", journal = j-TOIS, volume = "43", number = "5", pages = "115:1--115:26", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3716499", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommender systems primarily utilize user-item interactions (i.e., collaborative information) and auxiliary textual information (i.e., semantic information) to infer user preferences and provide recommendations. With the advancement in large language \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "115", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yang:2025:FPL, author = "Qi Yang and Aleksandr Farseev and Marlo Ongpin and Alfred Huang and Yu-Yi Chu-Farseeva and Da-Min You and Kirill Lepikhin and Sergey Nikolenko", title = "Fusing Predictive and Large Language Models for Actionable Recommendations in Creative Marketing", journal = j-TOIS, volume = "43", number = "5", pages = "116:1--116:31", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3725885", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The opaqueness of modern digital advertising, exemplified by large platforms such as Meta Ads, raises concerns regarding their control over audience targeting, pricing structures, and ad relevancy assessments. Locked in place by network effects, these \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "116", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Fu:2025:UFM, author = "Zichuan Fu and Xiangyang Li and Chuhan Wu and Yichao Wang and Kuicai Dong and Xiangyu Zhao and Mengchen Zhao and Huifeng Guo and Ruiming Tang", title = "A Unified Framework for Multi-Domain {CTR} Prediction via Large Language Models", journal = j-TOIS, volume = "43", number = "5", pages = "117:1--117:33", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3698878", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Multi-Domain Click-Through Rate (MDCTR) prediction is crucial for online recommendation platforms, which involves providing personalized recommendation services to users in different domains. However, current MDCTR models are confronted with the following \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "117", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tang:2025:OMA, author = "Zuoli Tang and Zhaoxin Huan and Zihao Li and Xiaolu Zhang and Jun Hu and Chilin Fu and Jun Zhou and Lixin Zou and Chenliang Li", title = "One Model for All: Large Language Models Are Domain-Agnostic Recommendation Systems", journal = j-TOIS, volume = "43", number = "5", pages = "118:1--118:27", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3705727", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Sequential recommendation systems aim to predict users' next likely interaction based on their history. However, these systems face data sparsity and cold-start problems. Utilizing data from other domains, known as multi-domain methods, is useful for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "118", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2025:TTB, author = "Xi He and Yilin Liu and Weikang He and Xin Xing and Xingyu Lu and Yanbing Liu", title = "{TCKT}: Tree-Based Cross-domain Knowledge Transfer for Next {POI} Cold-Start Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "119:1--119:31", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3709137", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The next point of interest (POI) recommendation task recommends POIs to users that they may be interested in next time based on their historical trajectories. This task holds value for both users and businesses. However, it has consistently faced the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "119", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xin:2025:LEC, author = "Haoran Xin and Ying Sun and Chao Wang and Hui Xiong", title = "{LLMCDSR}: Enhancing Cross-Domain Sequential Recommendation with Large Language Models", journal = j-TOIS, volume = "43", number = "5", pages = "120:1--120:33", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3715099", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Cross-Domain Sequential Recommendation (CDSR) aims to predict users' preferences based on historical sequential interactions across multiple domains. Existing works focus on the overlapped users who interact in multiple domains to capture the cross-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "120", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sang:2025:DHG, author = "Lei Sang and Yu Wang and Yiwen Zhang and Xindong Wu", title = "Denoising Heterogeneous Graph Pre-training Framework for Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "121:1--121:31", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3706632", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Heterogeneous graph neural networks (HGNN) have exhibited significant performance gains by modeling the information propagation process in graph-structured data for recommender systems. However, existing HGNN-based Recommendation still face two challenges:. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "121", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lai:2025:WTE, author = "Hanyu Lai and Xiao Liu and Hao Yu and Yifan Xu and Iat Long Iong and Shuntian Yao and Aohan Zeng and Zhengxiao Du and Yuxiao Dong and Jie Tang", title = "{WebGLM}: Towards an Efficient and Reliable {Web}-Enhanced Question-Answering System", journal = j-TOIS, volume = "43", number = "5", pages = "122:1--122:43", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3729421", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "We present WebGLM, an enhanced Large Language Model (LLM)-based retrieval question-answering system based on the ChatGLM3-6B, offering significant improvements over previous systems. We aim to augment a pre-trained LLM with web search and reliable \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "122", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xiao:2025:ICR, author = "Likang Xiao and Richong Zhang and Junfan Chen and Lei Zhang", title = "Including Co-Relation via Concatenate Operator for Static and Temporal Knowledge Graph Embedding", journal = j-TOIS, volume = "43", number = "5", pages = "123:1--123:26", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733231", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Knowledge Graph Completion (KGC) aims to complete KGs by predicting missing entities. A common solution for KGC is Knowledge Graph Embedding (KGE), which assumes that semantical similar entities or relationships should possess similar representations in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "123", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jing:2025:EAP, author = "Erkang Jing and Yezheng Liu and Yidong Chai and Shuo Yu and Longshun Liu and Yuanchun Jiang and Yang Wang", title = "Emotion-aware Personalized Music Recommendation with a Heterogeneity-aware Deep {Bayesian} Network", journal = j-TOIS, volume = "43", number = "5", pages = "124:1--124:43", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3733233", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Music recommender systems play a critical role in music streaming platforms by providing users with music that they are likely to enjoy. Recent studies have shown that user emotions can influence users' preferences for music moods. However, existing \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "124", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2025:ICP, author = "Yiqing Wu and Ruobing Xie and Zhao Zhang and Xu Zhang and Fuzhen Zhuang and Leyu Lin and Zhanhui Kang and Zhulin An and Yongjun Xu", title = "{ID}-centric Pre-training for Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "125:1--125:29", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3735128", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Classical sequential recommendation models generally adopt ID embeddings to store knowledge learned from user historical behaviors and represent items. However, these unique IDs are challenging to be transferred to new domains. With the thriving of pre-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "125", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Vuong:2025:ICA, author = "Tung Vuong and Pritom Kumar Das and Tuukka Ruotsalo", title = "Incorporating Cognitive Abilities into {Web} Search Re-ranking", journal = j-TOIS, volume = "43", number = "5", pages = "126:1--126:35", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736401", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Web search ranking models learn from human interactions to improve retrieval performance, but they are presently limited by their use of behavioral factors, such as click-through data or dwell time, that do not account for differences in their users' \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "126", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lv:2025:DCR, author = "Xiangwei Lv and Guifeng Wang and Jingyuan Chen and Hejian Su and Zhiang Dong and Yumeng Zhu and Beishui Liao and Fei Wu", title = "Debiased Cognition Representation Learning for Knowledge Tracing", journal = j-TOIS, volume = "43", number = "5", pages = "127:1--127:30", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736576", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Knowledge tracing (KT) is a fundamental task in intelligent education aimed at tracking students' knowledge status and predicting their performance on new questions. The primary challenge in KT is accurately inferring a high-quality representation of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "127", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2025:CDC, author = "Jiajie Zhu and Yan Wang and Feng Zhu and Zhu Sun", title = "Causal Deconfounding via Confounder Disentanglement for Dual-Target Cross-Domain Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "128:1--128:33", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3737457", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In recent years, dual-target Cross-Domain Recommendation (CDR) has been proposed to capture comprehensive user preferences in order to ultimately enhance the recommendation accuracy in both data-richer and data-sparser domains simultaneously. However, in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "128", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Su:2025:PTL, author = "Weihang Su and Qingyao Ai and Yueyue Wu and Anzhe Xie and Changyue Wang and Yixiao Ma and Haitao Li and Zhijing Wu and Yiqun Liu and Min Zhang", title = "Pre-training for Legal Case Retrieval Based on Inter-Case Distinctions", journal = j-TOIS, volume = "43", number = "5", pages = "129:1--129:27", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3735127", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Legal case retrieval aims to help legal workers find relevant cases related to their cases at hand, which is important for the guarantee of fairness and justice in legal judgments. While recent advances in neural retrieval methods have significantly \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "129", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2025:TTF, author = "Lianwei Wu and Kang Wang and Kunlin Nie and Sensen Guo and Chao Gao and Zhen Wang and Shudong Li", title = "{TFGIN}: Tight-Fitting Graph Inference Network for Table-based Fact Verification", journal = j-TOIS, volume = "43", number = "5", pages = "130:1--130:26", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3734520", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Fact verification task has emerged as an essential research topic recently due to abundant fake news spreading on the Internet. The task based on unstructured data (i.e., news) has achieved great development, but the task based on structured data (i.e., \ldots{})", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "130", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:LBR, author = "Yankai Chen and Yue Que and Xinni Zhang and Chen Ma and Irwin King", title = "Learning Binarized Representations with Pseudo-positive Sample Enhancement for Efficient Graph Collaborative Filtering", journal = j-TOIS, volume = "43", number = "5", pages = "131:1--131:28", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3744239", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Learning vectorized embeddings is fundamental to many recommender systems for user-item matching. To enable efficient online inference, representation binarization, which embeds latent features into compact binary sequences, has recently shown \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "131", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2025:UHH, author = "Zhenghong Lin and Yanchao Tan and Jiamin Chen and Hengyu Zhang and Chaochao Chen and Shiping Wang and Carl Yang", title = "Unified Heterogeneous Hypergraph Construction for Incomplete Multimedia Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "132:1--132:31", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3745020", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In the dynamic environment of multimedia-sharing platforms like X (formerly known as Twitter) and TikTok, multimedia recommendation systems have been widely used to help users discover items of interest. However, traditional approaches often fall short, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "132", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yao:2025:NRR, author = "Jing Yao and Xiting Wang and Jianxun Lian and Xiaoyuan Yi and Xing Xie", title = "Neural Recommendation Reasoning with Logic Rules", journal = j-TOIS, volume = "43", number = "5", pages = "133:1--133:28", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3742856", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Explainability is critical for recommender systems to ensure good user experience and facilitate designers to debug. However, generating explanations in recommender systems usually requires large efforts due to the dependency on additional data and case-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "133", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gui:2025:IPV, author = "Xiaoqiang Gui and Guoxian Yu and Jun Wang and Shuguang Han and Qingzhong Li and Yongqing Zheng and Wei Wang", title = "Interaction Privacy Vulnerability in Federated Recommendation and Lossless Countermeasure", journal = j-TOIS, volume = "43", number = "5", pages = "134:1--134:31", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3745025", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Federated Recommendation (FedRec) systems are recognized as privacy-preserving solutions for collaboratively training recommender models without sharing users' private data. However, recent studies have revealed that FedRec systems are vulnerable to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "134", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:ULL, author = "Junmei Wang and Fengjing Zhang and Xiadan Chen and Puyu He and Ellen Anne Huang and Jimmy Xiangji Huang", title = "Utilizing Large Language Model for Conversational Information Seeking via Dual-Query Generation and Joint-Encoding", journal = j-TOIS, volume = "43", number = "5", pages = "135:1--135:30", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3742423", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Conversational retrieval leverages multi-turn conversations to meet users' information needs, and accurately understanding the new intent has become a significant challenge in this field. Recently, the language comprehension and reasoning capabilities of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "135", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:ATO, author = "Heng-Da Xu and Xian-Ling Mao and Fanshu Sun and Tian-Yi Che and Chun Xu and Heyan Huang", title = "{AgentTOD}: a Task-Oriented Dialogue Agent with a Flexible and Adaptive {API} Calling Paradigm", journal = j-TOIS, volume = "43", number = "5", pages = "136:1--136:32", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3745021", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Task-oriented dialogue (TOD) systems play a vital role in numerous assistance and service scenarios, significantly improving people's daily lives. Conventionally, a TOD system adheres to a fixed paradigm, where it must first extract user goals and query \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "136", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2025:SEC, author = "Lei Guo and Chenlong Song and Feng Guo and Xiaohui Han and Xiaojun Chang and Lei Zhu", title = "Semantic-enhanced Co-attention Prompt Learning for Non-overlapping Cross-domain Recommendation", journal = j-TOIS, volume = "43", number = "5", pages = "137:1--137:27", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3742422", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Non-overlapping Cross-domain Sequential Recommendation (NCSR) is the task that focuses on domain knowledge transfer without overlapping entities. Compared with traditional Cross-domain Sequential Recommendation (CSR), NCSR poses several challenges: (1) \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "137", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Pan:2025:LDG, author = "Zhiqiang Pan and Chen Gao and Fei Cai and Honghui Chen and Yong Li", title = "Light Dynamic Graph Learning on Temporal Networks", journal = j-TOIS, volume = "43", number = "5", pages = "138:1--138:27", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3745024", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Dynamic graph learning on temporal networks aims to understand the continuous evolution pattern of networks, with an important application on forecasting the future temporal network. Existing methods mainly focus on modeling the structural and temporal \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "138", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lu:2025:ASB, author = "Xiaodong Lu and Mingzhe Liu and Tongyu Zhu and Leilei Sun and Jibin Wang and Weifeng Lv and Yikun Ban and Deqing Wang", title = "Adaptive Sampling-based Dynamic Graph Learning for Information Diffusion Prediction", journal = j-TOIS, volume = "43", number = "5", pages = "139:1--139:25", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3744643", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Information diffusion prediction, aimed at estimating future interacting users for a given content, is crucial for various applications on online social platforms. Recently, methods based on dynamic graph learning have achieved superior performance. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "139", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ma:2025:HNR, author = "Jingwei Ma and Jiahui Wen and Lei Zhu and Mingyang Zhong and Yang Xu and Lei Guo and Hongzhi Yin", title = "{HGDNet}: De-Noised Review-Based Rating Prediction Using Hierarchical Gating and Discriminative Networks", journal = j-TOIS, volume = "43", number = "5", pages = "140:1--140:26", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3746282", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The expressiveness of historical reviews in capturing user preferences has garnered significant attention in recommender systems. However, this technology still has certain limitations. Firstly, irrelevant reviews can introduce noise that may adversely \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "140", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2025:CSU, author = "Hanrui Wu and Yanxin Wu and Nuosi Li and Jia Zhang and Yonghui Xu and Michael K. Ng and Jinyi Long", title = "Cold-start User Recommendation via Heterogeneous Domain Adaptation", journal = j-TOIS, volume = "43", number = "5", pages = "141:1--141:26", month = sep, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3746637", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Oct 4 06:32:40 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In recommendation systems, cold-start user recommendation is a challenging problem, where precise recommendations are required for users who have not appeared before. Several existing cold-start user recommendation models adopt domain adaptation to \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "141", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yao:2025:ISI, author = "Lina Yao and Julian McAuley and Yongfeng Zhang and Kun Zhang", title = "Introduction to the Special Issue on Causality Representation Learning in {LLMs}-Driven Recommender Systems", journal = j-TOIS, volume = "43", number = "6", pages = "142:1--142:3", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3747838", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "142", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:CCC, author = "Xiaolong Xu and Hongsheng Dong and Haolong Xiang and Xiyuan Hu and Xiaoyong Li and Xiaoyu Xia and Xuyun Zhang and Lianyong Qi and Wanchun Dou", title = "{C2lRec}: Causal Contrastive Learning for User Cold-start Recommendation with Social Variables", journal = j-TOIS, volume = "43", number = "6", pages = "143:1--143:28", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3711858", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Embedding-based recommender systems rely on historical interactions to model users, which poses challenges for recommending to new users, known as the user cold-start problem. Some approaches incorporate social networks to deduce preferences based on the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "143", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yuan:2025:FEF, author = "Wei Yuan and Chaoqun Yang and Guanhua Ye and Tong Chen and Quoc Viet Hung Nguyen and Hongzhi Yin", title = "{FELLAS}: Enhancing Federated Sequential Recommendation with {LLM} as External Services", journal = j-TOIS, volume = "43", number = "6", pages = "144:1--144:24", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3709138", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Sequential recommendation has been widely studied in the recommendation domain since it can capture users' temporal preferences and provide more accurate and timely recommendations. To address user privacy concerns, the combination of federated learning \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "144", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:DRW, author = "Hao Wang and Zhichao Chen and Honglei Zhang and Zhengnan Li and Licheng Pan and Haoxuan Li and Mingming Gong", title = "Debiased Recommendation via {Wasserstein} Causal Balancing", journal = j-TOIS, volume = "43", number = "6", pages = "145:1--145:24", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3725731", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommendation systems are pivotal in improving user experience on various digital platforms. However, observational training data in recommendation systems introduce selection bias, which leads to a distributional discrepancy between training data and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "145", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Xu:2025:CSR, author = "Hangtong Xu and Yuanbo Xu and Chaozhuo Li and Fuzhen Zhuang", title = "Causal Structure Representation Learning of Unobserved Confounders in Latent Space for Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "146:1--146:29", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3731447", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Inferring user preferences from users' historical feedback is a valuable problem in recommender systems. Conventional approaches often rely on the assumption that user preferences in the feedback data are equivalent to the real user preferences without \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "146", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2025:CTA, author = "Sirui Huang and Qian Li and Haoran Yang and Dianer Yu and Qing Li and Guandong Xu", title = "Causal Time-aware News Recommendations with Large Language Models", journal = j-TOIS, volume = "43", number = "6", pages = "147:1--147:25", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3729422", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Predicting user satisfaction over time is crucial in news recommendations, as users' preferences are significantly influenced by various time-variant factors. Traditional correlation-based recommenders often suffer from redundant relationships, which can \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "147", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:IIS, author = "Fan Wang and Lianyong Qi and Weiming Liu and Bowen Yu and Jintao Chen and Yanwei Xu", title = "Inter- and Intra-Similarity Preserved Counterfactual Incentive Effect Estimation for Recommendation Systems", journal = j-TOIS, volume = "43", number = "6", pages = "148:1--148:24", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3722104", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Personalized incentives are crucial for boosting user engagement and increasing platform revenues. Many studies have utilized uplift modeling to estimate the conditional average treatment effects (CATEs) of incentives and then allocate them under cost \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "148", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yu:2025:CCI, author = "Shuo Yu and Yicong Li and Shuo Wang and Tao Tang and Qiang Zhang and Jingjing Zhou and Ivan Lee and Feng Xia", title = "{CaGE}: a Causality-inspired Graph Neural Network Explainer for Recommender Systems", journal = j-TOIS, volume = "43", number = "6", pages = "149:1--149:29", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3729224", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Generating post hoc causal explanations for graph neural network-based recommender systems is vital for enhancing the credibility and interpretability of recommendations. Existing model-agnostic explainers primarily capture statistical correlations \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "149", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:MPB, author = "Guixian Zhang and Guan Yuan and Debo Cheng and Lin Liu and Jiuyong Li and Shichao Zhang", title = "Mitigating Propensity Bias of Large Language Models for Recommender Systems", journal = j-TOIS, volume = "43", number = "6", pages = "150:1--150:26", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3736404", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The rapid development of Large Language Models (LLMs) creates new opportunities for recommender systems, especially by exploiting the side information (e.g., descriptions and analyses of items) generated by these models. However, aligning this side \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "150", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:CVI, author = "Yuzhe Chen and Jie Cao and Youquan Wang and Jia Wu and Huanhuan Chen and Guandong Xu", title = "Causal Variational Inference for Deconfounded Multi-Behavior Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "151:1--151:26", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3745023", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Multi-Behavior Recommendation (MBR) aims to model personalized user preferences by integrating diverse interaction behaviors (e.g., page view, favorite, add to cart, purchase). However, latent confounders such as contextual influences and social \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "151", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lu:2025:GEC, author = "Kezhi Lu and Jie Lu and Hanshi Xu and Kairui Guo and Qian Zhang and Hua Lin and Mark Grosser and Yi Zhang and Guangquan Zhang", title = "Genomics-Enhanced Cancer Risk Prediction for Personalized {LLM}-Driven Healthcare Recommender Systems", journal = j-TOIS, volume = "43", number = "6", pages = "152:1--152:30", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3745022", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Cancer risk prediction is a cornerstone of personalized medicine that offers opportunities for early detection and preventive interventions. However, the current models are designed to predict cancer risk face several challenges. First, most rely on \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "152", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:CIF, author = "Weixin Chen and Li Chen and Yongxin Ni and Yuhan Zhao", title = "Causality-Inspired Fair Representation Learning for Multimodal Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "153:1--153:29", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3744240", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recently, multimodal recommendations (MMRs) have gained increasing attention for alleviating the data sparsity problem of traditional recommender systems by incorporating modality-based representations. Although MMR exhibits notable improvement in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "153", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhao:2025:DAU, author = "Xuhao Zhao and Yanmin Zhu and Chunyang Wang and Mengyuan Jing and Wenze Ma and Jiadi Yu and Feilong Tang", title = "Dual-Adaptive Update Strategies-Enhanced Meta-Optimization for User Cold-Start Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "154:1--154:36", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3746634", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "User cold-start recommendation presents a significant challenge for recommender systems, affecting their overall effectiveness. Meta-learning-based methods have been introduced to address this issue. These methods treat the user cold-start recommendation \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "154", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:SMM, author = "Zeyu Zhang and Quanyu Dai and Xiaohe Bo and Chen Ma and Rui Li and Xu Chen and Jieming Zhu and Zhenhua Dong and Ji-Rong Wen", title = "A Survey on the Memory Mechanism of Large Language Model-based Agents", journal = j-TOIS, volume = "43", number = "6", pages = "155:1--155:47", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3748302", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Large language model (LLM)-based agents have recently attracted much attention from the research and industry communities. Compared with original LLMs, LLM-based agents are featured in their self-evolving capability, which is the basis for solving real-. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "155", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2025:NBL, author = "Zhenhua Wang and Chen Zhang and Ming Ren", title = "A Novel {Benford's Law}-Driven Approach for Detecting Machine-Generated Text", journal = j-TOIS, volume = "43", number = "6", pages = "156:1--156:25", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3748305", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/benfords-law.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Detecting Machine-Generated Text (MGT) is critical for the sustainable development of information systems. Existing studies often overlook the generation inconsistency between AI and human, limiting the effectiveness of detection. This article introduces a novel detection approach, BENADV, and the motivation stems from our recognition that, unlike MGT (probabilistic token prediction), Human-Written Text (HWT) is influenced by individual factors (e.g., personal experience), which constitutes a form of ``manipulation'' at the textual level. Specifically, BENADV is built on our new discovery that MGT adheres more closely to Benford's law compared to HWT. We leverage the adherence patterns as detection mechanisms, and further enhance detection performance through adversarial perturbations controlled by stochastic differential equations. Extensive experiments on general-domain datasets demonstrate that BENADV is SOTA. For instance, on the HC3 dataset, BENADV achieves 99.13\% accuracy and 99.18\% F1, outperforming existing methods by 1.16--7.82\% and 1.37--8.30\%. Moreover, BENADV exhibits remarkable scalability, with its performance consistently exceeding 96\% on vertical domain datasets as AI advances (from GPT-3.5 to GPT-4), far surpassing the 50--60\% performance of existing methods. Notably, BENADV excels in the more challenging short MGT detection. Also, we provide practical insights and discuss implications.", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "156", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2025:ASR, author = "Xiaopeng Li and Lixin Su and Pengyue Jia and Suqi Cheng and Junfeng Wang and Dawei Yin and Xiangyu Zhao", title = "{Agent4Ranking}: Semantic Robust Ranking via Personalized Query Rewriting Using Multi-Agent {LLMs}", journal = j-TOIS, volume = "43", number = "6", pages = "157:1--157:33", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3749099", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Search engines are crucial as they provide an efficient and easy way to access vast amounts of information on the Internet for diverse information needs. User queries, even with a specific need, can differ significantly. Prior research has explored the \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "157", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2025:CIM, author = "Zhihao Guo and Peng Song and Chenjiao Feng and Kaixuan Yao and Jiye Liang", title = "Causal Inference for Multi-Criteria Rating Recommender Systems", journal = j-TOIS, volume = "43", number = "6", pages = "158:1--158:30", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3757737", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recommender systems are designed to assist users in discovering interesting items and bringing profits to online platforms. The existing works primarily explore the correlation between historical feedback and model predictions through the data-driven \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "158", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2025:SRG, author = "Qian Zhang and Shoujin Wang and Longbing Cao and Defu Lian and Haibo Zhang and Wenpeng Lu", title = "Semantic Relation Guided Dual-view Contrastive Learning for Session-based Recommendations", journal = j-TOIS, volume = "43", number = "6", pages = "159:1--159:36", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3750724", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Session-based Recommender Systems (SBRSs) aim to recommend the next item to users based on their historical interactions with items within or between sessions. A session is constituted by a sequence of interactions between the user and items within a \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "159", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:DHS, author = "Li Chen and Rui Liu and Yuxiang Zhou and Xudong Ma and Yong Chen and Dell Zhang", title = "Deep Hashing with Semantic Hash Centers for Image Retrieval", journal = j-TOIS, volume = "43", number = "6", pages = "160:1--160:38", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3749983", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/hash.bib; https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Deep hashing presents an effective strategy for large-scale image retrieval. Current hashing methods are generally categorized by their supervision types: point-wise, pairwise, and list-wise. Recent advancements in point-wise methods (e.g., CSQ, MDS) have significantly enhanced retrieval performance across diverse datasets by pre-assigning a hash center to each class, thereby improving the discriminability of the resultant hash codes. However, these methods employ purely data-independent algorithms for generating hash centers, overlooking the semantic connections between different classes, which, we argue, could degrade retrieval performance. To tackle this problem, this article expands on the newly emerged concept of hash centers to introduce semantic hash centers, which posits that hash centers of semantically related classes should exhibit closer Hamming distances, while those of unrelated classes should be more distant.\par Based on this hypothesis, we propose a three-stage framework, termed Semantic Hash Centers (SHC), to produce hash codes that preserve semantics. First, we build a classification network to detect semantic similarities between classes, and utilize a data-dependent approach to similarity calculation that can adapt to varied data distributions. Next, we develop a new optimization algorithm to generate SHC. This algorithm not only maintains semantic relatedness among hash centers but also integrates a constraint to ensure a minimum distance between them, addressing the issue of excessively proximate hash centers potentially impairing retrieval performance. Finally, we train a deep hashing network with the above generated SHC to convert each image into a binary hash code. Experiments on large-scale image retrieval across several public datasets demonstrate that SHC generates more discriminative hash codes, markedly enhancing retrieval performance. Specifically, in terms of the mAP@100, mAP@1000, and mAP@ALL metrics, SHC records average improvements of +6.24\%, +6.68\%, and +10.39\%, respectively, over the most competitive existing methods. The code of our SHC project is available at \url{https://github.com/cc752424640/Deep-Hashing-with-Semantic-Hash-Centers-for-Image-Retrieval}.", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "160", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Su:2025:DAT, author = "Jiajie Su and Chaochao Chen and Yihao Wang and Weiming Liu and Yuyuan Li and Tao Wang and Zhigang Li and Xiaolin Zheng and Jianwei Yin", title = "{DuAda}: Adaptive Targeted Model Poisoning Attack Framework via Dummy User Simulation on Federated Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "161:1--161:37", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3757059", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Federated Recommendation (FedRec) has been widely applied recently for realizing privacy preservation in recommender systems. However, due to direct uploads of model gradients from all clients, FedRec is vulnerable to potential poisoning attacks. In this \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "161", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Sang:2025:BHG, author = "Lei Sang and Maohao Huang and Yu Wang and Yiwen Zhang and Xindong Wu", title = "Bottlenecked Heterogeneous Graph Contrastive Learning for Robust Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "162:1--162:36", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3750725", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In recommender systems, heterogeneous graph neural networks (HGNNs) have demonstrated remarkable efficacy due to their capacity to harness rich auxiliary information within heterogeneous information networks (HINs). However, existing HGNN-based \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "162", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Yu:2025:BLC, author = "Dianer Yu and Qian Li and Huan Huo and Guandong Xu", title = "Breaking the Loop: Causal Learning to Mitigate Echo Chambers in Social Networks", journal = j-TOIS, volume = "43", number = "6", pages = "163:1--163:27", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3757738", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In social networks, echo chambers form when users primarily encounter information that reinforces their existing views with limited exposure to different perspectives. This self-reinforcing isolation worsens societal issues such as division and declining \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "163", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Jiang:2025:URS, author = "Wenjun Jiang and Song Li and Xueqi Li and Kenli Li and Jie Wu", title = "Uncovering Recommendation Serendipity with Objective Data-driven Factor Investigation", journal = j-TOIS, volume = "43", number = "6", pages = "164:1--164:33", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3758092", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The serendipity recommendation tries to burst the filter bubble while still meeting user interests. However, serendipity itself has not been well understood in the recommendation system. Thus, factor investigation in recommendation serendipity has \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "164", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Chen:2025:PAG, author = "Jiajia Chen and Jiancan Wu and Jiawei Chen and Chongming Gao and Yong Li and Xiang Wang", title = "Position-aware Graph Transformer for Recommendation", journal = j-TOIS, volume = "43", number = "6", pages = "165:1--165:24", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3757736", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Collaborative recommendation fundamentally involves learning high-quality user and item representations from interaction data. Recently, graph convolution networks (GCNs) have advanced the field by utilizing high-order connectivity patterns in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "165", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Barsamian:2025:CIL, author = "Yann Barsamian and Andr{\'e} Chailloux", title = "Compressing Integer Lists with Contextual Arithmetic Trits", journal = j-TOIS, volume = "43", number = "6", pages = "166:1--166:29", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3749098", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Inverted indexes allow to query large databases without needing to search in the database at each query. An important line of research is to construct inverted indexes that require a rather small space usage while still allowing low timings for \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "166", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Mo:2025:SCS, author = "Fengran Mo and Kelong Mao and Ziliang Zhao and Hongjin Qian and Haonan Chen and Yiruo Cheng and Xiaoxi Li and Yutao Zhu and Zhicheng Dou and Jian-Yun Nie", title = "A Survey of Conversational Search", journal = j-TOIS, volume = "43", number = "6", pages = "167:1--167:50", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3759453", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "As a cornerstone of modern information access, search engines have become indispensable in everyday life. With the rapid advancements in AI and natural language processing (NLP) technologies, particularly large language models (LLMs), search engines have \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "167", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2025:TGO, author = "Yang Deng and Zifeng Ren and An Zhang and Tat-Seng Chua", title = "Towards Goal-oriented Intelligent Tutoring Systems in Online Education", journal = j-TOIS, volume = "43", number = "6", pages = "168:1--168:26", month = nov, year = "2025", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3760401", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Fri Oct 10 05:49:16 MDT 2025", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Interactive Intelligent Tutoring Systems (ITSs) enhance the learning experience in online education by fostering effective learning through interactive problem-solving. However, many current ITS models do not fully incorporate proactive engagement \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "168", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wu:2026:DNP, author = "Ziqing Wu and Zhu Sun and Dongxia Wang and Lu Zhang and Jie Zhang and Yew-Soon Ong", title = "Decentralized Next Point-of-Interest Recommendation Guided by Willingness to Share", journal = j-TOIS, volume = "44", number = "1", pages = "1:1--1:27", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3766066", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Decentralized learning (DL) has proven to be effective for privacy-preserving next point-of-interest (POI) recommendation by sharing check-in information among users and collaboratively training on-device models. Existing works, however, simply assume \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{He:2026:UIA, author = "Zhiyu He and Shaorun Zhang and Weizhi Ma and Jiayu Li and Peijie Sun and Qingyao Ai and Yiqun Liu and Min Zhang", title = "User Immersion-aware Short Video Recommendation", journal = j-TOIS, volume = "44", number = "1", pages = "2:1--2:33", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3748303", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Short videos have gained immense popularity, necessitating effective recommender systems that cater to individual preferences. The platforms use advanced algorithms to analyze user engagement and provide videos that satisfy users. A critical factor in \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "2", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2026:SGB, author = "Wen Zhang and Rui Li and Quan Bai and Song Wang", title = "{SparseFraudNet}: a Graph-based Approach for Cold-start Fraud Detection with Information Aggregation", journal = j-TOIS, volume = "44", number = "1", pages = "3:1--3:45", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3748719", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Online reviews play a critical role in influencing consumer's purchasing decision on e-commerce, making them a prime target for manipulation through fraudulent reviews. Although various Fraud Detection (FD) techniques have been presented, a crucial \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "3", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Tang:2026:ERS, author = "Jiakai Tang and Jingsen Zhang and Zihang Tian and Xueyang Feng and Lei Wang and Xu Chen", title = "Explainable Recommendation with Simulated Human Feedback", journal = j-TOIS, volume = "44", number = "1", pages = "4:1--4:31", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3758091", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recent advancements in explainable recommendation have greatly bolstered user experience by elucidating the decision-making rationale. However, the existing methods actually fail to provide effective feedback signals for potentially better or worse \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "4", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Guo:2026:CCG, author = "Jiafeng Guo and Changjiang Zhou and Ruqing Zhang and Jiangui Chen and Maarten de Rijke and Yixing Fan and Xueqi Cheng", title = "{CorpusBrain++}: a Continual Generative Pre-Training Framework for Knowledge-Intensive Language Tasks", journal = j-TOIS, volume = "44", number = "1", pages = "5:1--5:35", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3763233", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Knowledge-intensive language tasks (KILTs) typically require retrieving relevant documents from trustworthy corpora, e.g., Wikipedia, to produce specific answers. Very recently, a pre-trained generative retrieval model for KILTs, named CorpusBrain, was \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "5", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Wang:2026:LSL, author = "Bohao Wang and Feng Liu and Changwang Zhang and Jiawei Chen and Yudi Wu and Sheng Zhou and Xingyu Lou and Jun Wang and Yan Feng and Chun Chen and Can Wang", title = "{LLM4DSR}: Leveraging Large Language Model for Denoising Sequential Recommendation", journal = j-TOIS, volume = "44", number = "1", pages = "6:1--6:32", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3762182", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Sequential recommenders generate recommendations based on users' historical interaction sequences. However, in practice, these sequences are often contaminated by noisy interactions, which can arise from various factors such as clickbait, the influence \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "6", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Datta:2026:PDB, author = "Suchana Datta and Guglielmo Faggioli and Nicola Ferro and Debasis Ganguly and Cristina Ioana Muntean and Raffaele Perego and Nicola Tonellotto", title = "Projection-Displacement-Based Query Performance Prediction for Embedded Space of Dense Retrievers", journal = j-TOIS, volume = "44", number = "1", pages = "7:1--7:30", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3765617", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recent advances in representation learning have enabled neural Information Retrieval (IR) systems to use learned dense representations for queries and documents to effectively handle semantics, language nuances, and vocabulary mismatch problems. In \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "7", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhou:2026:SML, author = "Huachi Zhou and Kaijing Yu and Qinggang Zhang and Hao Chen and Daochen Zha and Wenqi Pei and Anthony Kong and Xiao Huang", title = "Self-Monitoring Large Language Models for Click-Through Rate Prediction", journal = j-TOIS, volume = "44", number = "1", pages = "8:1--8:25", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3763789", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Click-through rate prediction tasks estimate interaction probabilities using user-item features (i.e., the combined set of user and item features). LLMs have emerged as a promising approach by organizing these features into prompts and fine-tuning LLMs \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "8", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Faggioli:2026:GDD, author = "Guglielmo Faggioli and Nicola Ferro and Raffaele Perego and Nicola Tonellotto", title = "Getting off the {DIME}: Dimension Pruning via Dimension Importance Estimation for Dense Information Retrieval", journal = j-TOIS, volume = "44", number = "1", pages = "9:1--9:34", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3765619", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Dense Information Retrieval (IR) systems rely on neural networks to embed documents and queries within a latent low-dimensional space. Among the Dense IR approaches, bi-encoders are particularly popular, as they achieve state-of-the-art performance and \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "9", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2026:MAP, author = "Zhirui Deng and Zhicheng Dou and Yutao Zhu and Ji-Rong Wen", title = "A Model-agnostic Pre-training Framework for Search Result Diversification", journal = j-TOIS, volume = "44", number = "1", pages = "10:1--10:23", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3764662", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Search result diversification focuses on providing relevant and diverse documents covering different users' intents. Intuitively, training an effective and stable search result diversification model needs a large amount of training data. Unfortunately, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "10", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Deng:2026:SCT, author = "Zhirui Deng and Zhicheng Dou and Yutao Zhu and Ji-Rong Wen", title = "Social Cognitive Theory Enhanced Diversified Recommendation", journal = j-TOIS, volume = "44", number = "1", pages = "11:1--11:24", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3767324", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The diversified recommendation aims to satisfy a user's different preferences and hence alleviates the information cocoon problem. Previous methods focus on increasing the sample probability of interacted items in the long-tail category. However, these \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "11", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhu:2026:LLM, author = "Yutao Zhu and Huaying Yuan and Shuting Wang and Jiongnan Liu and Wenhan Liu and Chenlong Deng and Haonan Chen and Zheng Liu and Zhicheng Dou and Ji-Rong Wen", title = "Large Language Models for Information Retrieval: a Survey", journal = j-TOIS, volume = "44", number = "1", pages = "12:1--12:54", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3748304", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "As a primary means of information acquisition, information retrieval (IR) systems, such as search engines, have integrated themselves into our daily lives. These systems also serve as components of dialogue, question-answering, and recommender systems. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "12", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Gryshchuk:2026:PDR, author = "Vadym Gryshchuk and Maria Maistro and Christina Lioma and Tuukka Ruotsalo", title = "Predicting Document Relevance from Brain Recordings", journal = j-TOIS, volume = "44", number = "1", pages = "13:1--13:30", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3766067", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recent neuroimaging studies have revealed the association between relevance and brain responses. However, fundamental questions about how the human brain responds to a human relevance judgement of an entire text document and how such responses could be \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "13", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Hao:2026:IMI, author = "Xiulan Hao and Xinwei Li and Hua Wang and Zhonglong Zheng and Yunliang Jiang and Yanchun Zhang", title = "{ITCoHD-MRec}: an Independent Topological Preference-Aware and Cooperative Hypergraph Diffusion-Based Multimodal Recommender Model", journal = j-TOIS, volume = "44", number = "1", pages = "14:1--14:29", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3767337", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Multimodal recommendation provides richer and more accurate personalized recommendations by jointly modeling user's historical behaviors and different modality of items, such as text, image, audio, and video in online platforms. Most existing work of \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "14", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2026:LRR, author = "Weixian Waylon Li and Tiejun Ma", title = "Learn to Rank Risky Investors: a Case Study of Predicting Retail Traders' Behaviour and Profitability", journal = j-TOIS, volume = "44", number = "1", pages = "15:1--15:33", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3768623", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Identifying risky traders with high profits in financial markets is crucial for market makers, such as trading exchanges, to ensure effective risk management through real-time decisions on regulation compliance and hedging. However, capturing the complex \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "15", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2026:MCH, author = "Xiang Li and Changsheng Shui and Zhongying Zhao and Junyu Dong and Yanwei Yu", title = "Multi-Channel Hypergraph Contrastive Learning for Matrix Completion", journal = j-TOIS, volume = "44", number = "1", pages = "16:1--16:27", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3768319", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Rating is a typical user's explicit feedback that visually reflects how much a user likes a related item. The (rating) matrix completion is essentially a rating prediction process, which is also a significant problem in recommender systems. Recently, \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "16", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liu:2026:RNI, author = "Yu-An Liu and Ruqing Zhang and Jiafeng Guo and Maarten de Rijke and Yixing Fan and Xueqi Cheng", title = "Robust Neural Information Retrieval: an Adversarial and Out-of-Distribution Perspective", journal = j-TOIS, volume = "44", number = "1", pages = "17:1--17:48", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3768153", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recent advances in neural information retrieval models have significantly enhanced these models' effectiveness across information retrieval tasks. The robustness of these models, which is essential for ensuring their reliability in practice, has also \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "17", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Ke:2026:LLM, author = "Wenjun Ke and Yifan Zheng and Yining Li and Hengyuan Xu and Dong Nie and Peng Wang and Yao He", title = "Large Language Models in Document Intelligence: a Comprehensive Survey, Recent Advances, Challenges, and Future Trends", journal = j-TOIS, volume = "44", number = "1", pages = "18:1--18:64", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3768156", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "The rapid proliferation of documents has made document intelligence increasingly critical across various industries. In recent years, Large Language Models (LLMs) have dramatically transformed the field of document intelligence, allowing for more \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "18", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Song:2026:CSC, author = "Xuemeng Song and Haoqiang Lin and Haokun Wen and Bohan Hou and Mingzhu Xu and Liqiang Nie", title = "A Comprehensive Survey on Composed Image Retrieval", journal = j-TOIS, volume = "44", number = "1", pages = "19:1--19:54", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3767328", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Composed Image Retrieval (CIR) is an emerging yet challenging task that allows users to search for target images using a multimodal query, comprising a reference image and a modification text specifying the user's desired changes to the reference image. \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "19", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Lin:2026:KGP, author = "Fake Lin and Xi Zhu and Ziwei Zhao and Deqiang Huang and Yu Yu and Xueying Li and Zhi Zheng and Tong Xu and Enhong Chen", title = "Knowledge Graph Pruning for Recommendation", journal = j-TOIS, volume = "44", number = "1", pages = "20:1--20:28", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3769107", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Recent years have witnessed the prosperity of Knowledge Graph-Based Recommendation System (KGRS), which enriches the representation of users, items, and entities by structural knowledge with striking improvement. Nevertheless, its unaffordable \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "20", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhai:2026:PGN, author = "Panyu Zhai and Yanwu Yang and Chunjie Zhang", title = "Periodic Graph Neural Networks for Click-Through Rate Prediction in Online Advertising", journal = j-TOIS, volume = "44", number = "1", pages = "21:1--21:37", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3769103", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "CTR prediction serves as a valuable function to provide indications about the effectiveness of advertising campaigns. Numerous models have been developed to learn dynamic representations and sophisticated feature interactions for CTR prediction. We \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "21", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Li:2026:GIL, author = "Xinyu Li and Chuang Zhao and Hongke Zhao and Likang Wu and Ming He and Jianping Fan", title = "{GANPrompt}: Improving {LLM}-Based Recommendations with {GAN}-Enhanced Diversity Prompts", journal = j-TOIS, volume = "44", number = "1", pages = "22:1--22:36", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3769428", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Large Language Models (LLMs) have demonstrated remarkable proficiency in understanding and generating natural language, with an increasing presence in the field of recommendation systems. However, LLMs still encounter a significant issue known as prompt \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "22", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Dacrema:2026:RAC, author = "Maurizio Ferrari Dacrema and Michael Benigni and Nicola Ferro", title = "Reproducibility and Artifact Consistency of the {SIGIR 2022} Recommender Systems Papers Based on Message Passing", journal = j-TOIS, volume = "44", number = "1", pages = "23:1--23:43", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3772275", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Graph-based techniques relying on neural networks and embeddings have gained attention as a way to develop Recommender Systems (RS) with several papers on the topic presented at SIGIR 2022 and 2023. Given the importance of ensuring that published \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "23", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2026:HAS, author = "Zheng Zhang and Qi Liu and Zirui Hu and Yi Zhan and Zhenya Huang and Weibo Gao and Qingyang Mao and Enhong Chen", title = "A Hybrid Adaptive Sampling Strategy for Fair and Accurate Meta-learned User Modeling", journal = j-TOIS, volume = "44", number = "1", pages = "24:1--24:39", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3769296", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "User modeling serves as a crucial foundation for researchers to capture useful potential characteristics, playing a pivotal role in various applications such as recommender systems. One common challenge in user modeling is the cold-start problem, where \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "24", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2026:RUA, author = "Guangping Zhang and Dongsheng Li and Hansu Gu and Peng Zhang and Tun Lu and Li Shang and Ning Gu", title = "{RECOSIM}: a Universal, Accurate, and Scalable Simulation Framework for Online Community Recommendations", journal = j-TOIS, volume = "44", number = "1", pages = "25:1--25:42", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3768342", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "As recommender systems become increasingly important components in online communities, studying their impact on these communities becomes ever more crucial. Facing the high costs and ethical risks of real-world social experiments, researchers construct \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "25", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Zhang:2026:BTI, author = "Haoyao Zhang and Zhida Qin and Xufeng Liang and Jing Guo and Shuang Li and Tianyu Huang and John C. S. Lui", title = "Beyond Texts: Incorporating Co-occurrences into the Review-based Conversation Recommendation Systems", journal = j-TOIS, volume = "44", number = "1", pages = "26:1--26:32", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3771276", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "Conversational Recommender Systems (CRSs) interact with users through natural language to provide recommendations and generate responses. Due to limited information in conversation, existing works utilize KGs or reviews to improve CRS. Despite \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "26", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Qi:2026:KDR, author = "Lianyong Qi and Jianye Xie and Chunhua Hu and Xiaolong Xu and Haolong Xiang and Haipeng Dai and Rong Gu and Xuyun Zhang and Wanchun Dou", title = "Knowledge-Driven Reasoning for Compatible and Interpretable {API} Recommendation via Teacher {LLM} Distillation", journal = j-TOIS, volume = "44", number = "1", pages = "27:1--27:30", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3771772", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "API recommendation is a crucial task in code intelligence, aiming to suggest suitable APIs for programming queries. Recent efforts have integrated Large Language Models (LLMs) into this task. However, these methods overlook the compatibility between \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "27", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Huang:2026:CSR, author = "Junjie Huang and Jizheng Chen and Jianghao Lin and Jiarui Qin and Ziming Feng and Weinan Zhang and Yong Yu", title = "A Comprehensive Survey on Retrieval Methods in Recommender Systems", journal = j-TOIS, volume = "44", number = "1", pages = "28:1--28:43", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3771925", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", abstract = "In an era dominated by information overload, effective recommender systems are essential for managing the deluge of data across digital platforms. Multi-stage cascade ranking systems are widely used in the industry, with retrieval and ranking being two \ldots{}", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "28", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } @Article{Liang:2026:ELE, author = "Xurong Liang and Tong Chen and Wei Yuan and Hongzhi Yin", title = "Erratum: {Lightweight} Embeddings with Graph Rewiring for Collaborative Filtering", journal = j-TOIS, volume = "44", number = "1", pages = "1:1--1:??", month = jan, year = "2026", CODEN = "ATISET", DOI = "https://doi.org/10.1145/3785705", ISSN = "1046-8188", ISSN-L = "1046-8188", bibdate = "Sat Jan 31 08:31:05 MST 2026", bibsource = "https://www.math.utah.edu/pub/tex/bib/tois.bib", note = "See \cite{Liang:2025:LEG}.", abstract = "This is an erratum for the article ``Lightweight Embeddings with Graph Rewiring for Collaborative Filtering'' published in ACM Trans. Inf. Syst. 43, 4, Article 108 (July 2025), 29 pages.", acknowledgement = ack-nhfb, ajournal = "ACM Trans. Inf. Sys.", articleno = "C1", fjournal = "ACM Transactions on Information Systems (TOIS)", journal-URL = "https://dl.acm.org/loi/tois", } %%% ==================================================================== %%% Cross-referenced entries must come last: @Proceedings{Croft:1989:SCR, editor = "W. Bruce Croft", booktitle = "{SIGIR Conference on Research and Development in Information Retrieval}", title = "{SIGIR Conference on Research and Development in Information Retrieval}", volume = "7(3)", publisher = pub-ACM, address = pub-ACM:adr, pages = "183--316", month = jul, year = "1989", CODEN = "ATISET", ISSN = "1046-8188", bibdate = "Sat Jan 16 19:04:41 MST 1999", bibsource = "Compendex database; https://www.math.utah.edu/pub/tex/bib/tois.bib", series = j-TOIS, abstract = "The conference materials contain 6 papers. The areas covered include formal models, search strategies, hypermedia, storage structures, natural language processing, and knowledge-based architectures, storage on optical disks, hypertext, based help systems, probabilistic retrieval model, information retrieval from an artificial intelligence perspective, document and query texts parsing are the main topics covered. All papers are abstracted and indexed separately.", acknowledgement = ack-nhfb, classification = "723; 903; 922", conference = "SIGIR Conference on Research and Development in Information Retrieval", conferenceyear = "1989", editoraddress = "Amherst, MA, USA", editoraffiliation = "Univ of Massachusetts", journalabr = "ACM Trans Inf Syst", keywords = "Artificial Intelligence; cd-rom Full Text Storage; Computer Interfaces --- Human Factors; Data Storage; Database Systems; Information Retrieval Systems; Knowledge Based Search; Natural Language Processing; Optical; Probabilistic Retrieval Model; Probability; String Text Retrieval", meetingaddress = "Cambridge, MA, USA", meetingdate = "Jun 1989", meetingdate2 = "06/89", }