-
Notifications
You must be signed in to change notification settings - Fork 0
/
references.bib
2115 lines (1932 loc) · 69.1 KB
/
references.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% Venue-name shorthands used inside booktitle fields, e.g. \sigir{29th}.
% \providecommand keeps any existing definition, so loading the generated
% bibliography more than once does not raise "Command already defined".
@PREAMBLE{ "\providecommand{\sigir}[1]{Proceedings of the #1 Annual International
ACM SIGIR Conference on Research and Development in Information
Retrieval}" }
@PREAMBLE{ "\providecommand{\cikm}[1]{Proceedings of the #1 International
Conference on Information and Knowledge Management}" }
@PREAMBLE{ "\providecommand{\wsdm}[1]{Proceedings of the #1 ACM International
Conference on Web Search and Data Mining}" }
% NOTE(review): the citation key below looks like an auto-generated
% placeholder; confirm nothing cites it before giving it a real key.
@proceedings{**key*,
  editor    = {Xiaofang Zhou},
  title     = {Database Technologies 2002, Thirteenth Australasian
               Database Conference (ADC2002), Monash University,
               Melbourne, Victoria, January/February 2002},
  booktitle = {ADC},
  series    = {CRPIT},
  volume    = {5},
  publisher = {Australian Computer Society},
  year      = {2002},
  isbn      = {0-909-92583-6},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{abadi:column-stores:2008,
  author    = {Abadi, D. J. and Madden, S. R. and Hachem, N.},
  title     = {Column-stores vs. row-stores: How different are they really?},
  booktitle = {Proceedings of the 2008 ACM SIGMOD International
               Conference on Management of Data},
  year      = {2008}
}
@inproceedings{agarwal:fast:2012,
  author    = {Deepak Agarwal and Maxim Gurevich},
  title     = {Fast top-k retrieval for model based recommendation},
  booktitle = {Proc.\ of the Fifth Int.\ Conf.\ on Web Search and Data
               Mining},
  pages     = {483--492},
  year      = {2012},
  doi       = {10.1145/2124295.2124354},
  ee        = {http://doi.acm.org/10.1145/2124295.2124354},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{aly:taily:2013,
  author       = {Aly, Robin and Hiemstra, Djoerd and Demeester, Thomas},
  title        = {Taily: shard selection using the tail of score distributions},
  booktitle    = {Proceedings of the 36th international ACM SIGIR conference
                  on Research and development in information retrieval},
  pages        = {673--682},
  year         = {2013},
  organization = {ACM}
}
@inproceedings{anh:impact:2002,
  author    = {Vo Ngoc Anh and Alistair Moffat},
  title     = {Impact transformation: effective and efficient web
               retrieval},
  booktitle = {Proc.\ of the 25th Annual Int.\ ACM SIGIR Conf.\ on
               Research and Development in Information Retrieval},
  pages     = {3--10},
  year      = {2002}
}
@inproceedings{anh:improved:2002,
  author    = {Vo Ngoc Anh and Alistair Moffat},
  title     = {Improved Retrieval Effectiveness Through Impact Transformation},
  booktitle = {Proc.\ of the 13th Australasian Database Conference},
  year      = {2002},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@article{anh:improved:2006,
  author   = {V. N. Anh and A. Moffat},
  title    = {Improved word-aligned binary compression for text
              indexing},
  journal  = {IEEE Transactions on Knowledge and Data Engineering},
  volume   = {18},
  number   = {6},
  pages    = {857--861},
  year     = {2006},
  month    = jun,
  issn     = {1041-4347},
  keywords = {binary codes;data compression;indexing;information
              retrieval;text analysis;compressed inverted
              indexes;improved word-aligned binary compression;text
              indexing;text retrieval system;word-aligned binary coding
              carry method;Binary
              codes;Compaction;Databases;Decoding;Frequency;Indexing;Information
              retrieval;Probability distribution;Data compaction and
              compression;Web searching.;binary code;compression;file
              organization;indexing methods;inverted index;text retrieval
              system;text searching;textual databases}
}
@article{anh:inverted:2005,
  author   = {Anh, V. N. and Moffat, A.},
  title    = {Inverted index compression using word-aligned binary
              codes},
  journal  = {Information Retrieval},
  volume   = {8},
  number   = {1},
  pages    = {151--166},
  year     = {2005},
  month    = jan,
  day      = {01},
  issn     = {1573-7659},
  abstract = {We examine index representation techniques for
              document-based inverted files, and present a mechanism for
              compressing them using word-aligned binary codes. The new
              approach allows extremely fast decoding of inverted lists
              during query processing, while providing compression rates
              better than other high-throughput representations. Results
              are given for several large text collections in support of
              these claims, both for compression effectiveness and query
              efficiency.}
}
@inproceedings{anh:pruned:2006,
  author    = {Anh, V. N. and Moffat, A.},
  title     = {Pruned query evaluation using pre-computed impacts},
  booktitle = {\sigir{29th}},
  pages     = {372--379},
  year      = {2006}
}
@inproceedings{anh:simplified:2005,
  author    = {Vo Ngoc Anh and Alistair Moffat},
  title     = {Simplified similarity scoring using term ranks},
  booktitle = {Proc.\ of the 28th Annual Int.\ ACM SIGIR Conf.\ on
               Research and Development in Information Retrieval},
  pages     = {226--233},
  year      = {2005},
  doi       = {10.1145/1076034.1076075},
  ee        = {http://doi.acm.org/10.1145/1076034.1076075},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{anh:vector-space:2001,
  author    = {Anh, V. N. and de Kretser, O. and Moffat, A.},
  title     = {Vector-space ranking with effective early termination},
  booktitle = {\sigir{24th}},
  pages     = {35--42},
  year      = {2001}
}
@inproceedings{arroyuelo:to:2012,
  author    = {Arroyuelo, Diego and Gonz{\'a}lez, Sen{\'e}n and Marin,
               Mauricio and Oyarz{\'u}n, Mauricio and Suel, Torsten},
  title     = {To Index or Not to Index: Time-space Trade-offs in Search
               Engines with Positional Ranking Functions},
  booktitle = {Proceedings of the 35th International ACM SIGIR Conference
               on Research and Development in Information Retrieval},
  series    = {SIGIR '12},
  pages     = {255--264},
  year      = {2012},
  publisher = {ACM},
  location  = {Portland, Oregon, USA},
  isbn      = {978-1-4503-1472-5},
  numpages  = {10},
  acmid     = {2348320},
  keywords  = {positional indexing, text compression for snippet
               generation}
}
@inproceedings{asadi:effectivenessefficiency:2013,
  author    = {Nima Asadi and Jimmy Lin},
  title     = {Effectiveness/efficiency tradeoffs for candidate
               generation in multi-stage retrieval architectures},
  booktitle = {Proc.\ of the 36th Int.\ ACM SIGIR Conf.\ on Research and
               Development in Information Retrieval},
  year      = {2013},
  doi       = {10.1145/2484028.2484132},
  url       = {http://doi.acm.org/10.1145/2484028.2484132},
  timestamp = {Mon, 03 Nov 2014 17:41:42 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/sigir/AsadiL13},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{asadi:fast:2012,
  author    = {Asadi, N. and Lin, J.},
  title     = {Fast candidate generation for two-phase document ranking:
               Postings list intersection with bloom filters},
  booktitle = {Proceedings of the 21st ACM International Conference on
               Information and Knowledge Management},
  pages     = {2419--2422},
  year      = {2012},
  numpages  = {4}
}
@phdthesis{asadi:multi-stage:2013,
  author = {N. Asadi},
  title  = {Multi-Stage Search Architectures for Streaming Documents},
  school = {University of Maryland},
  year   = {2013}
}
@inproceedings{baeza-yates:efficiency:2009,
  author       = {Baeza-Yates, Ricardo and Murdock, Vanessa and Hauff, Claudia},
  title        = {Efficiency trade-offs in two-tier web search systems},
  booktitle    = {Proceedings of the 32nd international ACM SIGIR conference
                  on Research and development in information retrieval},
  pages        = {163--170},
  year         = {2009},
  organization = {ACM}
}
@book{baeza-yates:modern:1999,
  author    = {Ricardo A. Baeza-Yates and Berthier A. Ribeiro-Neto},
  title     = {Modern Information Retrieval},
  publisher = {ACM Press / Addison-Wesley},
  year      = {1999},
  isbn      = {0-201-39829-X},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@article{barroso:web:2003,
  author    = {Barroso, Luiz Andr{\'e} and Dean, Jeffrey and H{\"o}lzle, Urs},
  title     = {Web search for a planet: The Google cluster architecture},
  journal   = {IEEE Micro},
  volume    = {23},
  number    = {2},
  pages     = {22--28},
  year      = {2003},
  publisher = {IEEE}
}
@inproceedings{bast:io-top-k:2006,
  author    = {Holger Bast and Debapriyo Majumdar and Ralf Schenkel and
               Martin Theobald and Gerhard Weikum},
  title     = {{IO}-{Top}-{K}: Index-access Optimized Top-k Query
               Processing},
  booktitle = {Proc.\ of the 32nd Int.\ Conf.\ on Very Large Data Bases},
  year      = {2006}
}
@inproceedings{bay:surf:2006,
  author    = {Bay, H. and Tuytelaars, T. and Van Gool, L.},
  title     = {{SURF}: Speeded up robust features},
  booktitle = {Proceedings of the 9th European Conference on Computer
               Vision},
  pages     = {404--417},
  year      = {2006},
  publisher = {Springer}
}
@inproceedings{bendersky:analysis:2009,
  author    = {Bendersky, M. and Croft, W. B.},
  title     = {Analysis of long queries in a large scale search log},
  booktitle = {Proceedings of the 2009 Workshop on Web Search Click Data},
  pages     = {8--14},
  year      = {2009},
  numpages  = {7}
}
@article{bentley:multidimensional:1975,
  author    = {Bentley, J. L.},
  title     = {Multidimensional binary search trees used for associative
               searching},
  journal   = {Communications of the ACM},
  volume    = {18},
  number    = {9},
  pages     = {509--517},
  year      = {1975},
  publisher = {ACM}
}
@inproceedings{beyer:when:1999,
  author    = {Beyer, K. and Goldstein, J. and Ramakrishnan, R. and
               Shaft, U.},
  title     = {When is ``nearest neighbor'' meaningful?},
  booktitle = {Proceedings of the 7th International Conference on
               Database Theory},
  pages     = {217--235},
  year      = {1999}
}
@inproceedings{blanco:document:2005,
  author       = {Blanco, Roi and Barreiro, {\'A}lvaro},
  title        = {Document identifier reassignment through dimensionality
                  reduction},
  booktitle    = {European Conference on Information Retrieval},
  pages        = {375--387},
  year         = {2005},
  organization = {Springer}
}
@article{blanco:probabilistic:2010,
  author  = {Roi Blanco and {\'A}lvaro Barreiro},
  title   = {Probabilistic static pruning of inverted files},
  journal = {ACM Transactions on Information Systems},
  volume  = {28},
  number  = {1},
  year    = {2010},
  month   = jan
}
@inproceedings{blandford:index:2002,
  author    = {Blandford, D. and Blelloch, G.},
  title     = {Index compression through document reordering},
  booktitle = {Proceedings of the 2002 Data Compression Conference},
  year      = {2002},
  pages     = {342--351}
}
@inproceedings{boldi:mg4j:2005,
  author    = {Paolo Boldi and Sebastiano Vigna},
  title     = {{MG4J} at {TREC} 2005},
  booktitle = {The Fourteenth Text REtrieval Conference (TREC 2005)
               Proceedings},
  editor    = {Ellen M. Voorhees and Lori P. Buckland},
  series    = {Special Publications},
  number    = {SP 500-266},
  publisher = {NIST},
  year      = 2005,
  note      = {\texttt{\small http://mg4j.di.unimi.it/}}
}
@article{boldi:permuting:2009,
  author  = {Boldi, P. and Santini, M. and Vigna, S.},
  title   = {Permuting web and social graphs},
  journal = {Internet Mathematics},
  volume  = {6},
  number  = {3},
  pages   = {257--283},
  year    = {2009}
}
@article{breiman:random:2001,
  author   = {Breiman, Leo},
  title    = {Random Forests},
  journal  = {Machine Learning},
  volume   = {45},
  number   = {1},
  pages    = {5--32},
  year     = {2001},
  issn     = {1573-0565},
  doi      = {10.1023/A:1010933404324},
  url      = {http://dx.doi.org/10.1023/A:1010933404324},
  abstract = {Random forests are a combination of tree predictors such
              that each tree depends on the values of a random vector
              sampled independently and with the same distribution for
              all trees in the forest. The generalization error for
              forests converges a.s. to a limit as the number of trees in
              the forest becomes large. The generalization error of a
              forest of tree classifiers depends on the strength of the
              individual trees in the forest and the correlation between
              them. Using a random selection of features to split each
              node yields error rates that compare favorably to Adaboost
              (Y. Freund {\&} R. Schapire, Machine Learning: Proceedings
              of the Thirteenth International conference, ***, 148--156),
              but are more robust with respect to noise. Internal
              estimates monitor error, strength, and correlation and
              these are used to show the response to increasing the
              number of features used in the splitting. Internal
              estimates are also used to measure variable importance.
              These ideas are also applicable to regression.}
}
@article{brin:anatomy:1998,
  author    = {Sergey Brin and Lawrence Page},
  title     = {The Anatomy of a Large-Scale Hypertextual Web Search Engine},
  journal   = {Computer Networks},
  volume    = {30},
  number    = {1-7},
  pages     = {107--117},
  year      = {1998},
  doi       = {10.1016/S0169-7552(98)00110-X},
  url       = {http://dx.doi.org/10.1016/S0169-7552(98)00110-X},
  timestamp = {Thu, 06 Nov 2014 01:39:54 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/journals/cn/BrinP98},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@article{brin:reprint:2012,
  author  = {Brin, S. and Page, L.},
  title   = {Reprint of: The anatomy of a large-scale hypertextual web
             search engine},
  journal = {Computer Networks},
  volume  = {56},
  number  = {18},
  pages   = {3825--3833},
  year    = {2012}
}
@inproceedings{broder:efficient:2003,
  author    = {Broder, A. Z. and Carmel, D. and Herscovici, M. and
               Soffer, A. and Zien, J.},
  title     = {Efficient query evaluation using a two-level retrieval process},
  booktitle = {\cikm{12th}},
  pages     = {426--434},
  year      = {2003},
  numpages  = {9}
}
@article{broschart:high-performance:2012,
  author    = {Andreas Broschart and Ralf Schenkel},
  title     = {High-performance processing of text queries with tunable
               pruned term and term pair indexes},
  journal   = {{ACM} Trans. Inf. Syst.},
  volume    = {30},
  number    = {1},
  pages     = {5},
  year      = {2012},
  doi       = {10.1145/2094072.2094077},
  url       = {http://doi.acm.org/10.1145/2094072.2094077},
  timestamp = {Sat, 08 Nov 2014 18:45:49 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/journals/tois/BroschartS12},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{buttcher:document-centric:2006,
  author    = {Stefan B{\"{u}}ttcher and Charles L. A. Clarke},
  title     = {A document-centric approach to static index pruning in
               text retrieval systems},
  booktitle = {Proc.\ of the 15th {ACM} Conf.\ Information and Knowledge
               Management},
  year      = {2006},
  doi       = {10.1145/1183614.1183644},
  url       = {http://doi.acm.org/10.1145/1183614.1183644},
  timestamp = {Sun, 09 Nov 2014 01:31:34 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/cikm/ButtcherC06},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@misc{callan:clueweb09:2009,
  author = {Callan, J. and Hoy, M. and Yoo, C. and Zhao, L.},
  title  = {Clueweb09 data set},
  year   = {2009},
  url    = {http://lemurproject.org/clueweb09/}
}
@inproceedings{callan:searching:1995,
  author       = {Callan, James P and Lu, Zhihong and Croft, W Bruce},
  title        = {Searching distributed collections with inference networks},
  booktitle    = {Proceedings of the 18th annual international ACM SIGIR
                  conference on Research and development in information
                  retrieval},
  pages        = {21--28},
  year         = {1995},
  organization = {ACM}
}
@incollection{callan:distributed:2002,
  author    = {Callan, Jamie},
  title     = {Distributed information retrieval},
  booktitle = {Advances in information retrieval},
  pages     = {127--150},
  publisher = {Springer},
  year      = {2002}
}
@inproceedings{cambazoglu:early:2010,
  author    = {Berkant Barla Cambazoglu and Hugo Zaragoza and Olivier
               Chapelle and Jiang Chen and Ciya Liao and Zhaohui Zheng and
               Jon Degenhardt},
  title     = {Early exit optimizations for additive machine learned
               ranking systems},
  booktitle = {Proc.\ of the Third Int.\ Conf.\ on Web Search and Data
               Mining},
  year      = {2010},
  doi       = {10.1145/1718487.1718538},
  url       = {http://doi.acm.org/10.1145/1718487.1718538},
  timestamp = {Mon, 03 Nov 2014 17:39:29 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/wsdm/CambazogluZCCLZD10},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{cambazoglu:quantifying:2009,
  author       = {Cambazoglu, B Barla and Plachouras, Vassilis and
                  Baeza-Yates, Ricardo},
  title        = {Quantifying performance and quality gains in distributed
                  web search engines},
  booktitle    = {Proceedings of the 32nd international ACM SIGIR conference
                  on Research and development in information retrieval},
  pages        = {411--418},
  year         = {2009},
  organization = {ACM}
}
@incollection{castellanos:hotminer:2004,
  author    = {Castellanos, Mal{\'u}},
  title     = {Hotminer: Discovering hot topics from dirty text},
  booktitle = {Survey of Text Mining},
  pages     = {123--157},
  publisher = {Springer},
  year      = {2004}
}
@inproceedings{chakrabarti:interval-based:2011,
  author    = {Kaushik Chakrabarti and Surajit Chaudhuri and Venkatesh
               Ganti},
  title     = {Interval-based pruning for top-k processing over
               compressed lists},
  booktitle = {Proc.\ of the 27th Int.\ Conf.\ on Data Engineering},
  year      = {2011},
  doi       = {10.1109/ICDE.2011.5767855},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/ICDE.2011.5767855},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{chaudhuri:heavy-tailed:2007,
  author    = {Surajit Chaudhuri and Kenneth Ward Church and Arnd
               Christian K{\"{o}}nig and Liying Sui},
  title     = {Heavy-tailed distributions and multi-keyword queries},
  booktitle = {Proc.\ of the 30th Annual Int.\ ACM SIGIR Conf.\ on
               Research and Development in Information Retrieval},
  year      = {2007},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{chierichetti:on:2009,
  author    = {Chierichetti, F. and Kumar, R. and Lattanzi, S. and
               Mitzenmacher, M. and Panconesi, A. and Raghavan, P.},
  title     = {On compressing social networks},
  booktitle = {Proceedings of the 15th ACM SIGKDD International
               Conference on Knowledge Discovery and Data Mining},
  year      = {2009}
}
@inproceedings{chougrad:soft:2015,
  author    = {H. Chougrad and H. Zouaki and O. Alheyane},
  title     = {Soft assignment vs hard assignment coding for bag of
               visual words},
  booktitle = {2015 10th International Conference on Intelligent Systems:
               Theories and Applications (SITA)},
  year      = {2015},
  month     = oct,
  keywords  = {image classification;image coding;image
               representation;image retrieval;bag-of-visual word;hard
               assignment coding;image classification;image
               representation;image retrieval;machine level language;soft
               assignment coding;soft-assignment technique;vector
               quantization process;Encoding;Feature extraction;Image
               coding;Support vector
               machines;Testing;Training;Visualization;bag of visual
               words;image classification;locality-constrained linear
               coding;pooling;soft-assignment}
}
@article{cormack:efficient:2011,
  author    = {Gordon V. Cormack and Mark D. Smucker and Charles L. A.
               Clarke},
  title     = {Efficient and effective spam filtering and re-ranking for
               large web datasets},
  journal   = {Inf. Retr.},
  volume    = {14},
  number    = {5},
  pages     = {441--465},
  year      = {2011},
  doi       = {10.1007/s10791-011-9162-z},
  ee        = {http://dx.doi.org/10.1007/s10791-011-9162-z},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@article{cornacchia:flexible:2008,
  author    = {Roberto Cornacchia and S{\'a}ndor H{\'e}man and Marcin
               Zukowski and Arjen P. de Vries and Peter A. Boncz},
  title     = {Flexible and efficient {IR} using array databases},
  journal   = {VLDB J.},
  volume    = {17},
  number    = {1},
  pages     = {151--168},
  year      = {2008},
  doi       = {10.1007/s00778-007-0071-0},
  ee        = {http://dx.doi.org/10.1007/s00778-007-0071-0},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{crane:comparison:2017,
  author    = {Crane, M. and Culpepper, J. S. and Lin, J. and Mackenzie,
               J. and Trotman, A.},
  title     = {A comparison of document-at-a-time and score-at-a-time
               query evaluation},
  booktitle = {\wsdm{10th}},
  pages     = {201--210},
  year      = {2017}
}
@inproceedings{dang:query:2010,
  author    = {Van Dang and W. Bruce Croft},
  title     = {Query reformulation using anchor text},
  booktitle = {Proc.\ of the Third Int.\ Conf.\ on Web Search and Data
               Mining},
  pages     = {41--50},
  year      = {2010},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{dang:two-stage:2013,
  author    = {Van Dang and Michael Bendersky and W. Bruce Croft},
  title     = {Two-Stage Learning to Rank for Information Retrieval},
  booktitle = {Proc.\ of the 35th European Conf.\ on Information
               Retrieval},
  year      = {2013},
  doi       = {10.1007/978-3-642-36973-5_36},
  url       = {http://dx.doi.org/10.1007/978-3-642-36973-5_36},
  timestamp = {Mon, 03 Nov 2014 17:46:54 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/ecir/DangBC13},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{dean:challenges:2009,
  author    = {Jeffrey Dean},
  title     = {Challenges in building large-scale information retrieval
               systems},
  booktitle = {Proceedings of the Second ACM International Conference on
               Web Search and Data Mining},
  year      = {2009}
}
@inproceedings{dhillon:information-theoretic:2003,
  author       = {Dhillon, Inderjit S and Mallela, Subramanyam and Modha,
                  Dharmendra S},
  title        = {Information-theoretic co-clustering},
  booktitle    = {Proceedings of the ninth ACM SIGKDD international
                  conference on Knowledge discovery and data mining},
  pages        = {89--98},
  year         = {2003},
  organization = {ACM}
}
@inproceedings{dimopoulos:candidate:2013,
  author    = {Constantinos Dimopoulos and Sergey Nepomnyachiy and
               Torsten Suel},
  title     = {A candidate filtering mechanism for fast top-k query
               processing on modern {CPUs}},
  booktitle = {Proc.\ of the 36th Int.\ ACM SIGIR Conf.\ on Research and
               Development in Information Retrieval},
  year      = {2013},
  doi       = {10.1145/2484028.2484087},
  url       = {http://doi.acm.org/10.1145/2484028.2484087},
  timestamp = {Fri, 07 Nov 2014 01:58:10 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/sigir/DimopoulosNS13},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{dimopoulos:optimizing:2013,
  author    = {Dimopoulos, C. and Nepomnyachiy, S. and Suel, T.},
  title     = {Optimizing top-k document retrieval strategies for
               block-max indexes},
  booktitle = {\wsdm{6th}},
  pages     = {113--122},
  year      = {2013}
}
@inproceedings{ding:faster:2011,
  author    = {Ding, S. and Suel, T.},
  title     = {Faster top-k document retrieval using block-max indexes},
  booktitle = {\sigir{34th}},
  pages     = {993--1002},
  year      = {2011}
}
@inproceedings{ding:scalable:2010,
  author    = {Ding, S. and Attenberg, J. and Suel, T.},
  title     = {Scalable techniques for document identifier assignment in
               inverted indexes},
  booktitle = {Proceedings of the 19th International Conference on World
               Wide Web},
  year      = {2010}
}
@inproceedings{donmez:on:2009,
  author    = {Pinar Donmez and Krysta Marie Svore and Christopher J. C.
               Burges},
  title     = {On the local optimality of {LambdaRank}},
  booktitle = {Proc.\ of the 32nd Int.\ ACM SIGIR Conf.\ on Research and
               Development in Information Retrieval},
  year      = {2009},
  doi       = {10.1145/1571941.1572021},
  url       = {http://doi.acm.org/10.1145/1571941.1572021},
  timestamp = {Fri, 07 Nov 2014 18:35:13 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/sigir/DonmezSB09},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@article{duda:asymmetric:2013,
  author        = {J. Duda},
  title         = {Asymmetric numeral systems as close to capacity low state
                   entropy coders},
  journal       = {CoRR},
  volume        = {abs/1311.2540},
  year          = {2013},
  eprint        = {1311.2540},
  archiveprefix = {arXiv},
  url           = {http://arxiv.org/abs/1311.2540}
}
@inproceedings{elbagoury:rank-at-a-time:2016,
  author    = {Elbagoury, A. and Crane, M. and Lin, J.},
  title     = {Rank-at-a-time query processing},
  booktitle = {Proceedings of the 2016 ACM International Conference on
               the Theory of Information Retrieval},
  pages     = {229--232},
  year      = {2016},
  numpages  = {4}
}
% The year and month follow the issue date recorded in issue_date (March
% 1975), not the 2006 digital-library record. The citation key is left
% unchanged so existing citations keep resolving.
@article{elias:universal:2006,
  author     = {Elias, P.},
  title      = {Universal Codeword Sets and Representations of the
                Integers},
  journal    = {IEEE Trans. Inf. Theor.},
  volume     = {21},
  number     = {2},
  pages      = {194--203},
  year       = {1975},
  month      = mar,
  issue_date = {March 1975},
  issn       = {0018-9448},
  numpages   = {10},
  acmid      = {2268815},
  publisher  = {IEEE Press},
  address    = {Piscataway, NJ, USA}
}
@article{fagin:optimal:2003,
  author  = {Fagin, R. and Lotem, A. and Naor, M.},
  title   = {Optimal aggregation algorithms for middleware},
  journal = {Journal of computer and system sciences},
  volume  = {66},
  number  = {4},
  pages   = {614--656},
  year    = {2003}
}
% Authors are listed in the order printed on the paper (Carmel first).
% The citation key is left unchanged so existing citations keep resolving.
@inproceedings{fagin:static:2001,
  author    = {D. Carmel and D. Cohen and R. Fagin and E. Farchi and M.
               Herscovici and Y. Maarek and A. Soffer},
  title     = {Static index pruning for information retrieval systems},
  booktitle = {Proc.\ of the 24th Int.\ ACM SIGIR Conf.\ on Research and
               Development in Information Retrieval},
  pages     = {43--50},
  year      = {2001}
}
@article{fagin:combining:2002,
  author  = {Ronald Fagin},
  title   = {Combining Fuzzy Information: an Overview},
  journal = {SIGMOD Record},
  volume  = {31},
  number  = {2},
  pages   = {109--118},
  year    = {2002}
}
@article{fagni:boosting:2006,
  author    = {Tiziano Fagni and Raffaele Perego and Fabrizio Silvestri
               and Salvatore Orlando},
  title     = {Boosting the performance of Web search engines: Caching
               and prefetching query results by exploiting historical
               usage data},
  journal   = {{ACM} Trans. Inf. Syst.},
  volume    = {24},
  number    = {1},
  pages     = {51--78},
  year      = {2006},
  timestamp = {Tue, 06 Mar 2007 08:54:15 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/journals/tois/FagniPSO06},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{ferragina:on:2010,
  author    = {Ferragina, P. and Manzini, G.},
  title     = {On compressing the textual web},
  booktitle = {Proceedings of the 3rd ACM International Conference on Web
               Search and Data Mining},
  pages     = {391--400},
  year      = {2010},
  numpages  = {10}
}
% Journal and pages now describe the June 1981 journal issue that the
% volume, number, month and year fields already pointed to; the previous
% values came from a later anthology reprint.
@article{fischler:random:1981,
  author     = {Fischler, M. A. and Bolles, R. C.},
  title      = {Random sample consensus: a paradigm for model fitting with
                applications to image analysis and automated cartography},
  journal    = {Communications of the ACM},
  volume     = {24},
  number     = {6},
  pages      = {381--395},
  year       = {1981},
  month      = jun,
  issue_date = {June 1981},
  numpages   = {15}
}
@inproceedings{fontoura:efficiently:2011,
  author    = {Marcus Fontoura and Maxim Gurevich and Vanja Josifovski
               and Sergei Vassilvitskii},
  title     = {Efficiently encoding term co-occurrences in inverted
               indexes},
  booktitle = {Proc.\ of the 20th {ACM} Conf.\ Information and Knowledge
               Management},
  year      = {2011},
  doi       = {10.1145/2063576.2063626},
  url       = {http://doi.acm.org/10.1145/2063576.2063626},
  timestamp = {Sat, 08 Nov 2014 19:11:23 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/cikm/FontouraGJV11},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@inproceedings{garcia:access-ordered:2004,
  author       = {Garcia, Steven and Williams, Hugh E and Cannane, Adam},
  title        = {Access-ordered indexes},
  booktitle    = {Proceedings of the 27th Australasian conference on
                  Computer science-Volume 26},
  pages        = {7--14},
  year         = {2004},
  organization = {Australian Computer Society, Inc.}
}
@inproceedings{goel:predictive:2008,
  author    = {Sharad Goel and John Langford and Alexander L. Strehl},
  title     = {Predictive Indexing for Fast Search},
  booktitle = {Proc.\ of the 22nd Annual Conf.\ on Neural Information
               Processing Systems, Vancouver},
  year      = {2008},
  url       = {http://books.nips.cc/papers/files/nips21/NIPS2008_0840.pdf},
  timestamp = {Mon, 10 Nov 2014 02:18:45 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/conf/nips/GoelLS08},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
% Typed as a technical report: the record names an issuing institution
% but no journal, which the article type requires.
@techreport{gravano:generalizing:1999,
  author      = {Gravano, Luis and Garcia-Molina, Hector},
  title       = {Generalizing {GlOSS} to vector-space databases and broker
                 hierarchies},
  institution = {Stanford InfoLab},
  year        = {1999}
}
@article{gupta:information:2015,
  author  = {Manish Gupta and Michael Bendersky},
  title   = {Information Retrieval with Verbose Queries},
  journal = {Foundations and Trends in Information Retrieval},
  volume  = {9},
  number  = {3-4},
  pages   = {209--354},
  year    = {2015}
}
@misc{harman:inverted:1992,
  author = {Harman, D. and Fox, E. and Baeza-Yates, R. and Lee, W.},
  title  = {Inverted files},
  year   = {1992},
  url    = {http://orion.lcg.ufrj.br/Dr.Dobbs/books/book5/chap03.htm}
}
@inproceedings{hinneburg:what:2000,
  author    = {Hinneburg, A. and Aggarwal, C. C. and Keim, D. A.},
  title     = {What is the nearest neighbor in high dimensional spaces?},
  booktitle = {Proceedings of the 26th International Conference on Very
               Large Databases},
  pages     = {506--515},
  year      = {2000}
}
@article{holloway:read-optimized:2008,
  author     = {Holloway, A. L. and DeWitt, D. J.},
  title      = {Read-optimized databases, in depth},
  journal    = {Proceedings of the VLDB Endowment},
  volume     = {1},
  number     = {1},
  pages      = {502--513},
  year       = {2008},
  issue_date = {August 2008}
}
@inproceedings{huston:evaluating:2010,
  author    = {Huston, S. and Croft, W. B.},
  title     = {Evaluating verbose query processing techniques},
  booktitle = {\sigir{33rd}},
  pages     = {291--298},
  year      = {2010},
  numpages  = {8}
}
@article{hwang:optimizing:2007,
  author    = {Seung{-}won Hwang and Kevin Chen{-}Chuan Chang},
  title     = {Optimizing top-k queries for middleware access: {A}
               unified cost-based approach},
  journal   = {{ACM} Trans. Database Syst.},
  volume    = {32},
  number    = {1},
  pages     = {5},
  year      = {2007},
  doi       = {10.1145/1206049.1206054},
  url       = {http://doi.acm.org/10.1145/1206049.1206054},
  timestamp = {Mon, 11 Jun 2007 14:34:07 +0200},
  biburl    = {http://dblp.uni-trier.de/rec/bib/journals/tods/HwangC07},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@article{ilyas:survey:2008,
  author    = {Ihab F. Ilyas and George Beskales and Mohamed A. Soliman},
  title     = {A survey of top-\emph{k} query processing techniques in
               relational database systems},
  journal   = {{ACM} Comput. Surv.},
  volume    = {40},
  number    = {4},
  year      = {2008},
  doi       = {10.1145/1391729.1391730},
  url       = {http://doi.acm.org/10.1145/1391729.1391730},
  timestamp = {Mon, 03 Nov 2008 16:10:28 +0100},
  biburl    = {http://dblp.uni-trier.de/rec/bib/journals/csur/IlyasBS08},
  bibsource = {dblp computer science bibliography, http://dblp.org}
}
@article{jardine:use:1971,
  author  = {N. Jardine and C.J. van Rijsbergen},
  title   = {The use of hierarchic clustering in information retrieval},
  journal = {Information Storage and Retrieval},
  volume  = {7},
  number  = {5},
  pages   = {217--240},
  year    = {1971},
  issn    = {0020-0271},
  doi     = {10.1016/0020-0271(71)90051-9},
  url     = {http://www.sciencedirect.com/science/article/pii/0020027171900519}
}
@inproceedings{jia:efficient:2010,
  author    = {Jia, X.-F. and Trotman, A. and O'Keefe, R.},
  title     = {Efficient accumulator initialisation},
  booktitle = {Proceedings of the 15th Australasian Document Computing
               Symposium},
  pages     = {44--51},
  year      = {2010}
}
@inproceedings{jiang:towards:2007,
  author    = {Jiang, Y.-G. and Ngo, C.-W. and Yang, J.},
  title     = {Towards optimal bag-of-features for object categorization
               and semantic video retrieval},
  booktitle = {Proceedings of the 6th ACM international Conference on
               Image and Video Retrieval},
  pages     = {494--501},
  year      = {2007}
}
@inproceedings{jonassen:efficient:2011,
  author    = {Simon Jonassen and Svein Erik Bratsberg},
  title     = {Efficient Compressed Inverted Index Skipping for
               Disjunctive Text-Queries},
  booktitle = {Proc.\ of the 33rd European Conf.\ on Information
               Retrieval},
  year      = {2011},
  doi       = {10.1007/978-3-642-20161-5_53},
  ee        = {http://dx.doi.org/10.1007/978-3-642-20161-5_53},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{kaszkiel:term-ordered:1998,
  author    = {Kaszkiel, M. and Zobel, J.},
  title     = {Term-ordered query evaluation versus document-ordered
               query evaluation for large document databases},
  booktitle = {\sigir{21st}},
  pages     = {343--344},
  year      = {1998},
  numpages  = {2}
}
@article{kleinberg:authoritative:1999,
  author    = {Kleinberg, Jon M},
  title     = {Authoritative sources in a hyperlinked environment},
  journal   = {Journal of the ACM (JACM)},
  volume    = {46},
  number    = {5},
  pages     = {604--632},
  year      = {1999},
  publisher = {ACM}
}
@inproceedings{kulkarni:document:2010,
  author       = {Kulkarni, Anagha and Callan, Jamie},
  title        = {Document allocation policies for selective searching of
                  distributed indexes},
  booktitle    = {Proceedings of the 19th ACM international conference on
                  Information and knowledge management},
  pages        = {449--458},
  year         = {2010},
  organization = {ACM}
}
@article{kulkarni:selective:2015,
  author    = {Kulkarni, Anagha and Callan, Jamie},
  title     = {Selective search: Efficient and effective search of large
               textual collections},
  journal   = {ACM Transactions on Information Systems (TOIS)},
  volume    = {33},
  number    = {4},
  pages     = {17},
  year      = {2015},
  publisher = {ACM}
}
@InProceedings{ kulkarni:shard:2012,
title = {Shard ranking and cutoff estimation for topically