-
Notifications
You must be signed in to change notification settings - Fork 1
/
refs.bib
2418 lines (2196 loc) · 187 KB
/
refs.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
@inproceedings{bernstein_direct_2012,
location = {New York, {NY}, {USA}},
title = {Direct Answers for Search Queries in the Long Tail},
isbn = {978-1-4503-1015-4},
doi = {10.1145/2207676.2207710},
series = {{CHI} '12},
abstract = {Web search engines now offer more than ranked results. Queries on topics like weather, definitions, and movies may return inline results called answers that can resolve a searcher's information need without any additional interaction. Despite the usefulness of answers, they are limited to popular needs because each answer type is manually authored. To extend the reach of answers to thousands of new information needs, we introduce Tail Answers: a large collection of direct answers that are unpopular individually, but together address a large proportion of search traffic. These answers cover long-tail needs such as the average body temperature for a dog, substitutes for molasses, and the keyboard shortcut for a right-click. We introduce a combination of search log mining and paid crowdsourcing techniques to create Tail Answers. A user study with 361 participants suggests that Tail Answers significantly improved users' subjective ratings of search quality and their ability to solve needs without clicking through to a result. Our findings suggest that search engines can be extended to directly respond to a large new class of queries.},
pages = {237--246},
booktitle = {Proceedings of the {SIGCHI} Conference on Human Factors in Computing Systems},
publisher = {{ACM}},
author = {Bernstein, Michael S. and Teevan, Jaime and Dumais, Susan and Liebling, Daniel and Horvitz, Eric},
date = {2012},
keywords = {crowdsourcing, query log analysis, search user interfaces}
}
@inproceedings{teevan_slow_2013,
location = {New York, {NY}, {USA}},
title = {Slow Search: Information Retrieval Without Time Constraints},
isbn = {978-1-4503-2570-7},
series = {{HCIR} '13},
shorttitle = {Slow Search},
abstract = {Significant time and effort has been devoted to reducing the time between query receipt and search engine response, and for good reason. Research suggests that even slightly higher retrieval latency by Web search engines can lead to dramatic decreases in users' perceptions of result quality and engagement with the search results. While users have come to expect rapid responses from search engines, recent advances in our understanding of how people find information suggest that there are scenarios where a search engine could take significantly longer than a fraction of a second to return relevant content. This raises the important question: What would search look like if search engines were not constrained by existing expectations for speed? In this paper, we explore slow search, a class of search where traditional speed requirements are relaxed in favor of a high quality search experience. Via large-scale log analysis and user surveys, we examine how individuals value time when searching. We confirm that speed is important, but also show that there are many search situations where result quality is more important. This highlights intriguing opportunities for search systems to support new search experiences with high quality result content that takes time to identify. Slow search has the potential to change the search experience as we know it.},
pages = {1:1--1:10},
booktitle = {Proceedings of the Symposium on Human-Computer Interaction and Information Retrieval},
publisher = {{ACM}},
author = {Teevan, Jaime and Collins-Thompson, Kevyn and White, Ryen W. and Dumais, Susan T. and Kim, Yubin},
date = {2013},
keywords = {{citeDiss}, crowdsourcing, {INFORMATION} retrieval, Slow search, speed}
}
@report{kim_crowdsourcing_2013,
location = {Gaithersburg, Maryland},
title = {Crowdsourcing for Robustness in Web Search},
type = {Proceedings of {NIST} Special Publication: The Twenty-Second Text {REtrieval} Conference},
author = {Kim, Yubin and Kevyn, Collins-Thompson and Teevan, Jaime},
date = {2013-11},
keywords = {{citeDiss}}
}
@article{downie_music_2003,
title = {Music information retrieval},
volume = {37},
rights = {Copyright © 2002 American Society for Information Science and Technology},
issn = {1550-8382},
doi = {10.1002/aris.1440370108},
pages = {295--340},
number = {1},
journaltitle = {Annual Review of Information Science and Technology},
shortjournal = {Ann. Rev. Info. Sci. Tech.},
author = {Downie, J. Stephen},
date = {2003-01-01},
langid = {english},
}
@article{shera_librarians_1967,
title = {Librarians against Machines},
volume = {156},
issn = {0036-8075, 1095-9203},
doi = {10.1126/science.156.3776.746},
pages = {746--750},
number = {3776},
journaltitle = {Science},
shortjournal = {Science},
author = {Shera, Jesse H.},
date = {1967-05-12},
langid = {english},
pmid = {6022224}
}
@article{lintott_galaxy_2008,
title = {Galaxy Zoo : Morphologies derived from visual inspection of galaxies from the Sloan Digital Sky Survey},
shorttitle = {Galaxy Zoo},
abstract = {In order to understand the formation and subsequent evolution of galaxies one must first distinguish between the two main morphological classes of massive systems: spirals and early-type systems. This paper introduces a project, Galaxy Zoo, which provides visual morphological classifications for nearly one million galaxies, extracted from the Sloan Digital Sky Survey ({SDSS}). This achievement was made possible by inviting the general public to visually inspect and classify these galaxies via the internet. The project has obtained more than 40,000,000 individual classifications made by {\textasciitilde}100,000 participants. We discuss the motivation and strategy for this project, and detail how the classifications were performed and processed. We find that Galaxy Zoo results are consistent with those for subsets of {SDSS} galaxies classified by professional astronomers, thus demonstrating that our data provides a robust morphological catalogue. Obtaining morphologies by direct visual inspection avoids introducing biases associated with proxies for morphology such as colour, concentration or structual parameters. In addition, this catalogue can be used to directly compare {SDSS} morphologies with older data sets. The colour--magnitude diagrams for each morphological class are shown, and we illustrate how these distributions differ from those inferred using colour alone as a proxy for morphology.},
journaltitle = {0804.4483},
author = {Lintott, Chris J and Schawinski, Kevin and Slosar, Anze and Land, Kate and Bamford, Steven and Thomas, Daniel and Raddick, M. Jordan and Nichol, Robert C and Szalay, Alex and Andreescu, Dan and Murray, Phil and Berg, Jan van den},
date = {2008-04-29},
keywords = {Astrophysics},
file = {arXiv.org Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\V8EPT2QX\\0804.html:text/html}
}
@book{marshall_future_2000,
title = {The Future of Annotation in a Digital (Paper) World},
isbn = {0-87845-107-2},
abstract = {If order-making in the large is part of the institutional mission of libraries,
then order-making in the small—i.e., the informal work of annotating
and organizing materials collected in the service of particular dayto-
day work or pleasure—is part of the business of library patrons. This
discussion focuses on just such activities; activities that stem from readers'
engagements with texts, and possibly with each other, against a backdrop
of real-world settings and practices. I hesitate to call digital library patrons
users, since that is the word computer scientists tend to use to hide the
characteristics of what we hope is a diverse population.},
publisher = {Graduate School of Library and Information Science, University of Illinois at Urbana-Champaign.},
author = {Marshall, C.},
date = {2000},
langid = {english},
file = {Marshall_2000_The Future of Annotation in a Digital (Paper) World.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Graduate School of Library and Information Science, University of Illinois at Urbana-Champaign.2000\\Marshall_2000_The Future of Annotation in a Digital (Paper) World.pdf:application/pdf;Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\HBP3PHXR\\25539.html:text/html}
}
@inproceedings{li_exploring_2008,
location = {New York, {NY}, {USA}},
title = {Exploring question subjectivity prediction in community {QA}},
isbn = {978-1-60558-164-4},
doi = {10.1145/1390334.1390477},
series = {{SIGIR} '08},
abstract = {In this paper we begin to investigate how to automatically determine the subjectivity orientation of questions posted by real users in community question answering ({CQA}) portals. Subjective questions seek answers containing private states, such as personal opinion and experience. In contrast, objective questions request objective, verifiable information, often with support from reliable sources. Knowing the question orientation would be helpful not only for evaluating answers provided by users, but also for guiding the {CQA} engine to process questions more intelligently. Our experiments on Yahoo! Answers data show that our method exhibits promising performance.},
pages = {735--736},
booktitle = {Proceedings of the 31st annual international {ACM} {SIGIR} conference on Research and development in information retrieval},
publisher = {{ACM}},
author = {Li, Baoli and Liu, Yandong and Ram, Ashwin and Garcia, Ernest V. and Agichtein, Eugene},
date = {2008},
keywords = {question classification, subjectivity analysis},
file = {ACM Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\63GNH6SM\\Li et al. - 2008 - Exploring question subjectivity prediction in comm.pdf:application/pdf}
}
@article{linden_amazon.com_2003,
title = {Amazon.com recommendations: item-to-item collaborative filtering},
volume = {7},
issn = {1089-7801},
doi = {10.1109/MIC.2003.1167344},
shorttitle = {Amazon.com recommendations},
abstract = {Recommendation algorithms are best known for their use on e-commerce Web sites, where they use input about a customer's interests to generate a list of recommended items. Many applications use only the items that customers purchase and explicitly rate to represent their interests, but they can also use other attributes, including items viewed, demographic data, subject interests, and favorite artists. At Amazon.com, we use recommendation algorithms to personalize the online store for each customer. The store radically changes based on customer interests, showing programming titles to a software engineer and baby toys to a new mother. There are three common approaches to solving the recommendation problem: traditional collaborative filtering, cluster models, and search-based methods. Here, we compare these methods with our algorithm, which we call item-to-item collaborative filtering. Unlike traditional collaborative filtering, our algorithm's online computation scales independently of the number of customers and number of items in the product catalog. Our algorithm produces recommendations in real-time, scales to massive data sets, and generates high quality recommendations.},
pages = {76--80},
number = {1},
journaltitle = {{IEEE} Internet Computing},
author = {Linden, G. and Smith, B. and York, J.},
date = {2003-01},
keywords = {Advertising, Aggregates, Amazon.com recommendations, Clustering algorithms, cluster models, Collaboration, customer interests, demographic data, Demography, e-commerce, electronic commerce, Electronic mail, Filtering algorithms, information filtering, information filters, {INFORMATION} retrieval, item-to-item collaborative filtering, massive data sets, online store, Pediatrics, product catalog, real-time, real-time systems, recommendation algorithms, retail data processing, search-based methods, Web sites},
file = {IEEE Xplore Abstract Record:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\73A5PWAX\\abs_all.html:text/html;IEEE Xplore Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\DDKCZWA6\\Linden et al. - 2003 - Amazon.com recommendations item-to-item collabora.pdf:application/pdf}
}
@inproceedings{vieweg_microblogging_2010,
title = {Microblogging during two natural hazards events: what twitter may contribute to situational awareness},
shorttitle = {Microblogging during two natural hazards events},
pages = {1079--1088},
booktitle = {Proceedings of the {SIGCHI} conference on human factors in computing systems},
publisher = {{ACM}},
author = {Vieweg, Sarah and Hughes, Amanda L. and Starbird, Kate and Palen, Leysia},
date = {2010},
file = {Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\RS2ITD4S\\citation.html:text/html;Vieweg et al_2010_Microblogging during two natural hazards events.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2010\\Vieweg et al_2010_Microblogging during two natural hazards events.pdf:application/pdf}
}
@inproceedings{noll_web_2007,
location = {Berlin, Heidelberg},
title = {Web Search Personalization via Social Bookmarking and Tagging},
isbn = {3-540-76297-3 978-3-540-76297-3},
series = {{ISWC}'07/{ASWC}'07},
abstract = {In this paper, we present a new approach to web search personalization based on user collaboration and sharing of information about web documents. The proposed personalization technique separates data collection and user profiling from the information system whose contents and indexed documents are being searched for, i.e. the search engines, and uses social bookmarking and tagging to re-rank web search results. It is independent of the search engine being used, so users are free to choose the one they prefer, even if their favorite search engine does not natively support personalization. We show how to design and implement such a system in practice and investigate its feasibility and usefulness with large sets of real-word data and a user study.},
pages = {367--380},
booktitle = {Proceedings of the 6th International The Semantic Web and 2Nd Asian Conference on Asian Semantic Web Conference},
publisher = {Springer-Verlag},
author = {Noll, Michael G. and Meinel, Christoph},
date = {2007}
}
@inproceedings{bao_optimizing_2007,
location = {New York, {NY}, {USA}},
title = {Optimizing Web Search Using Social Annotations},
isbn = {978-1-59593-654-7},
doi = {10.1145/1242572.1242640},
series = {{WWW} '07},
abstract = {This paper explores the use of social annotations to improve websearch. Nowadays, many services, e.g. del.icio.us, have been developed for web users to organize and share their favorite webpages on line by using social annotations. We observe that the social annotations can benefit web search in two aspects: 1) the annotations are usually good summaries of corresponding webpages; 2) the count of annotations indicates the popularity of webpages. Two novel algorithms are proposed to incorporate the above information into page ranking: 1) {SocialSimRank} ({SSR})calculates the similarity between social annotations and webqueries; 2) {SocialPageRank} ({SPR}) captures the popularity of webpages. Preliminary experimental results show that {SSR} can find the latent semantic association between queries and annotations, while {SPR} successfully measures the quality (popularity) of a webpage from the web users' perspective. We further evaluate the proposed methods empirically with 50 manually constructed queries and 3000 auto-generated queries on a dataset crawledfrom delicious. Experiments show that both {SSR} and {SPRbenefit} web search significantly.},
pages = {501--510},
booktitle = {Proceedings of the 16th International Conference on World Wide Web},
publisher = {{ACM}},
author = {Bao, Shenghua and Xue, Guirong and Wu, Xiaoyuan and Yu, Yong and Fei, Ben and Su, Zhong},
date = {2007},
keywords = {evaluation, social annotation, social page rank, social similarity, web search}
}
@article{lerman_personalizing_2007,
title = {Personalizing image search results on flickr},
journaltitle = {Intelligent Information Personalization},
author = {Lerman, Kristina and Plangprasopchok, Anon and Wong, Chio},
date = {2007},
file = {Lerman et al_2007_Personalizing image search results on flickr.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Intelligent Information Personalization2007\\Lerman et al_2007_Personalizing image search results on flickr.pdf:application/pdf}
}
@article{furnas_vocabulary_1987,
title = {The vocabulary problem in human-system communication},
volume = {30},
issn = {00010782},
doi = {10.1145/32206.32212},
pages = {964--971},
number = {11},
journaltitle = {Communications of the {ACM}},
author = {Furnas, G. W. and Landauer, T. K. and Gomez, L. M. and Dumais, S. T.},
date = {1987-11-01},
file = {Furnas et al_1987_The vocabulary problem in human-system communication.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Communications of the ACM1987\\Furnas et al_1987_The vocabulary problem in human-system communication.pdf:application/pdf;Shibboleth Authentication Request:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\MXI3X6UN\\login.html:text/html}
}
@article{shu_signing_2012,
title = {Signing at the beginning makes ethics salient and decreases dishonest self-reports in comparison to signing at the end},
volume = {109},
issn = {0027-8424, 1091-6490},
doi = {10.1073/pnas.1209746109},
abstract = {Many written forms required by businesses and governments rely on honest reporting. Proof of honest intent is typically provided through signature at the end of, e.g., tax returns or insurance policy forms. Still, people sometimes cheat to advance their financial self-interests—at great costs to society. We test an easy-to-implement method to discourage dishonesty: signing at the beginning rather than at the end of a self-report, thereby reversing the order of the current practice. Using laboratory and field experiments, we find that signing before—rather than after—the opportunity to cheat makes ethics salient when they are needed most and significantly reduces dishonesty.},
pages = {15197--15200},
number = {38},
journaltitle = {Proceedings of the National Academy of Sciences},
shortjournal = {{PNAS}},
author = {Shu, Lisa L. and Mazar, Nina and Gino, Francesca and Ariely, Dan and Bazerman, Max H.},
date = {2012-09-18},
langid = {english},
pmid = {22927408},
keywords = {fraud, morality, nudge, policy-making},
file = {Shu et al_2012_Signing at the beginning makes ethics salient and decreases dishonest.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Proceedings of the National Academy of Sciences2012\\Shu et al_2012_Signing at the beginning makes ethics salient and decreases dishonest.pdf:application/pdf;Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\I69UWKGU\\15197.html:text/html}
}
@book{csikszentmihalyi_flow_1991,
title = {Flow: The psychology of optimal experience},
volume = {41},
shorttitle = {Flow},
publisher = {{HarperPerennial} New York},
author = {Csikszentmihalyi, Mihaly},
date = {1991}
}
@inproceedings{kazai_crowdsourcing_2011,
location = {New York, {NY}, {USA}},
title = {Crowdsourcing for Book Search Evaluation: Impact of Hit Design on Comparative System Ranking},
isbn = {978-1-4503-0757-4},
doi = {10.1145/2009916.2009947},
series = {{SIGIR} '11},
shorttitle = {Crowdsourcing for Book Search Evaluation},
abstract = {The evaluation of information retrieval ({IR}) systems over special collections, such as large book repositories, is out of reach of traditional methods that rely upon editorial relevance judgments. Increasingly, the use of crowdsourcing to collect relevance labels has been regarded as a viable alternative that scales with modest costs. However, crowdsourcing suffers from undesirable worker practices and low quality contributions. In this paper we investigate the design and implementation of effective crowdsourcing tasks in the context of book search evaluation. We observe the impact of aspects of the Human Intelligence Task ({HIT}) design on the quality of relevance labels provided by the crowd. We assess the output in terms of label agreement with a gold standard data set and observe the effect of the crowdsourced relevance judgments on the resulting system rankings. This enables us to observe the effect of crowdsourcing on the entire {IR} evaluation process. Using the test set and experimental runs from the {INEX} 2010 Book Track, we find that varying the {HIT} design, and the pooling and document ordering strategies leads to considerable differences in agreement with the gold set labels. We then observe the impact of the crowdsourced relevance label sets on the relative system rankings using four {IR} performance metrics. System rankings based on {MAP} and Bpref remain less affected by different label sets while the Precision@10 and {nDCG}@10 lead to dramatically different system rankings, especially for labels acquired from {HITs} with weaker quality controls. Overall, we find that crowdsourcing can be an effective tool for the evaluation of {IR} systems, provided that care is taken when designing the {HITs}.},
pages = {205--214},
booktitle = {Proceedings of the 34th International {ACM} {SIGIR} Conference on Research and Development in Information Retrieval},
publisher = {{ACM}},
author = {Kazai, Gabriella and Kamps, Jaap and Koolen, Marijn and Milic-Frayling, Natasa},
date = {2011},
keywords = {book search, {citeDiss}, crowdsourcing quality, prove it},
file = {Kazai et al_2011_Crowdsourcing for Book Search Evaluation.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2011\\Kazai et al_2011_Crowdsourcing for Book Search Evaluation.pdf:application/pdf}
}
@inproceedings{zhang_human_2012,
location = {New York, {NY}, {USA}},
title = {Human computation tasks with global constraints},
isbn = {978-1-4503-1015-4},
doi = {10.1145/2207676.2207708},
series = {{CHI} '12},
abstract = {An important class of tasks that are underexplored in current human computation systems are complex tasks with global constraints. One example of such a task is itinerary planning, where solutions consist of a sequence of activities that meet requirements specified by the requester. In this paper, we focus on the crowdsourcing of such plans as a case study of constraint-based human computation tasks and introduce a collaborative planning system called Mobi that illustrates a novel crowdware paradigm. Mobi presents a single interface that enables crowd participants to view the current solution context and make appropriate contributions based on current needs. We conduct experiments that explain how Mobi enables a crowd to effectively and collaboratively resolve global constraints, and discuss how the design principles behind Mobi can more generally facilitate a crowd to tackle problems involving global constraints.},
pages = {217--226},
booktitle = {Proceedings of the {SIGCHI} Conference on Human Factors in Computing Systems},
publisher = {{ACM}},
author = {Zhang, Haoqi and Law, Edith and Miller, Rob and Gajos, Krzysztof and Parkes, David and Horvitz, Eric},
date = {2012},
keywords = {collaborative planning, crowdware, groupware, human computation, mixed-initiative interaction},
file = {ACM Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\U4FIIPZD\\Zhang et al. - 2012 - Human computation tasks with global constraints.pdf:application/pdf}
}
@article{marmorstein_value_1992,
title = {The Value of Time Spent in Price-Comparison Shopping: Survey and Experimental Evidence},
volume = {19},
rights = {Copyright © 1992 Journal of Consumer Research, Inc.},
issn = {0093-5301},
shorttitle = {The Value of Time Spent in Price-Comparison Shopping},
abstract = {The value that consumers place on time spent in price-comparison shopping is central to the economics of information theory and models of consumers' search behavior. Yet few empirical studies have examined consumers' subjective value of time. Building on Gary Becker's work, this article presents two tests of a model of the subjective value of time. In an effort to explain consumers' subjective value of time while they are price-comparison shopping, the model introduces perceived enjoyment of shopping as a new explanatory variable. The findings reveal that respondents incorporate both wage rates and perceived enjoyment of price-comparison shopping into their subjective value of time.},
pages = {52--61},
number = {1},
journaltitle = {Journal of Consumer Research},
shortjournal = {Journal of Consumer Research},
author = {Marmorstein, Howard and Grewal, Dhruv and Fishe, Raymond P. H.},
date = {1992-06-01},
keywords = {{citeDiss}, temp},
file = {Marmorstein et al_1992_The Value of Time Spent in Price-Comparison Shopping.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Marmorstein et al_1992_The Value of Time Spent in Price-Comparison Shopping.pdf:application/pdf}
}
@article{konstan_grouplens_1997,
title = {{GroupLens}: Applying Collaborative Filtering to Usenet News},
volume = {40},
issn = {0001-0782},
doi = {10.1145/245108.245126},
shorttitle = {{GroupLens}},
pages = {77--87},
number = {3},
journaltitle = {Commun. {ACM}},
author = {Konstan, Joseph A. and Miller, Bradley N. and Maltz, David and Herlocker, Jonathan L. and Gordon, Lee R. and Riedl, John},
date = {1997-03},
keywords = {{citeDiss}, temp},
file = {ACM Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\K8H65RMZ\\Konstan et al. - 1997 - GroupLens Applying Collaborative Filtering to Use.pdf:application/pdf;ACM Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\W3J2CFHT\\Konstan et al. - 1997 - GroupLens Applying Collaborative Filtering to Use.pdf:application/pdf}
}
@article{gursoy_integrative_2004,
title = {{AN} {INTEGRATIVE} {MODEL} {OF} {TOURISTS}’ {INFORMATION} {SEARCH} {BEHAVIOR}},
volume = {31},
issn = {0160-7383},
doi = {10.1016/j.annals.2003.12.004},
abstract = {This article develops a comprehensive theoretical model that integrates the psychological/motivational, economics, and processing approaches into a cohesive whole for understanding tourists’ information seeking behavior. The model proposes that for immediate pre-purchase information needs, a consumer is likely to utilize either internal or external sources, or both. The search is likely to be influenced directly by the perceived internal and external costs, and the level of involvement required. Familiarity and expertise, learning and previous visits indirectly influence the search. Their influences are mediated by familiarity and expertise with the destination, which are, in turn, mediated by external and internal costs. Twenty-one propositions are developed for future testing.},
pages = {353--373},
number = {2},
journaltitle = {Annals of Tourism Research},
shortjournal = {Annals of Tourism Research},
author = {Gursoy, Dogan and {McCleary}, Ken W.},
date = {2004-04},
keywords = {-clérecherche de renseignements, apprentissage, {citeDiss}, connaissances, engagement, expertise, familiarité, familiarity, information search, involvement, learning, temp},
file = {Gursoy_McCleary_2004_AN INTEGRATIVE MODEL OF TOURISTS’ INFORMATION SEARCH BEHAVIOR.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Gursoy_McCleary_2004_AN INTEGRATIVE MODEL OF TOURISTS’ INFORMATION SEARCH BEHAVIOR.pdf:application/pdf;ScienceDirect Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\W7FNCH24\\S0160738303001397.html:text/html}
}
@inproceedings{dellarocas_what_2006,
title = {What motivates consumers to review a product online? A study of the product-specific antecedents of online movie reviews},
shorttitle = {What motivates consumers to review a product online?},
booktitle = {{WISE}},
author = {Dellarocas, Chrysanthos and Narayan, Ritu},
date = {2006},
keywords = {{citeDiss}, jdistribution, j-distribution, temp},
file = {Dellarocas_Narayan_2006_What motivates consumers to review a product online.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\2006\\Dellarocas_Narayan_2006_What motivates consumers to review a product online.pdf:application/pdf}
}
@inproceedings{hu_can_2006,
location = {New York, {NY}, {USA}},
title = {Can Online Reviews Reveal a Product's True Quality?: Empirical Findings and Analytical Modeling of Online Word-of-mouth Communication},
isbn = {1-59593-236-4},
doi = {10.1145/1134707.1134743},
series = {{EC} '06},
shorttitle = {Can Online Reviews Reveal a Product's True Quality?},
abstract = {As a digital version of word-of-mouth, online review has become a major information source for consumers and has very important implications for a wide range of management activities. While some researchers focus their studies on the impact of online product review on sales, an important assumption remains unexamined, that is, can online product review reveal the true quality of the product? To test the validity of this key assumption, this paper first empirically tests the underlying distribution of online reviews with data from Amazon. The results show that 53\% of the products have a bimodal and non-normal distribution. For these products, the average score does not necessarily reveal the product's true quality and may provide misleading recommendations. Then this paper derives an analytical model to explain when the mean can serve as a valid representation of a product's true quality, and discusses its implication on marketing practices.},
pages = {324--330},
booktitle = {Proceedings of the 7th {ACM} Conference on Electronic Commerce},
publisher = {{ACM}},
author = {Hu, Nan and Pavlou, Paul A. and Zhang, Jennifer},
date = {2006},
keywords = {bi-modal distribution, {citeDiss}, online reviews, temp, Word-of-mouth},
file = {Hu et al_2006_Can Online Reviews Reveal a Product's True Quality.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2006\\Hu et al_2006_Can Online Reviews Reveal a Product's True Quality.pdf:application/pdf}
}
@inproceedings{krishnan_who_2008,
location = {New York, {NY}, {USA}},
title = {Who Predicts Better?: Results from an Online Study Comparing Humans and an Online Recommender System},
isbn = {978-1-60558-093-7},
doi = {10.1145/1454008.1454042},
series = {{RecSys} '08},
shorttitle = {Who Predicts Better?},
abstract = {Algorithmic recommender systems attempt to predict which items a target user will like based on information about the user's prior preferences and the preferences of a larger community. After more than a decade of widespread use, researchers and system users still debate whether such "impersonal" recommender systems actually perform as well as human recommenders. We compare the performance of {MovieLens} algorithmic predictions with the recommendations made, based on the same user profiles, by active {MovieLens} users. We found that algorithmic collaborative filtering outperformed humans on average, though some individuals outperformed the system substantially and humans on average outperformed the system on certain prediction tasks.},
pages = {211--218},
booktitle = {Proceedings of the 2008 {ACM} Conference on Recommender Systems},
publisher = {{ACM}},
author = {Krishnan, Vinod and Narayanashetty, Pradeep Kumar and Nathan, Mukesh and Davies, Richard T. and Konstan, Joseph A.},
date = {2008},
keywords = {{citeDiss}, human recommenders, mae, movielens, predictions, recommender evaluation, recommender systems, temp},
file = {ACM Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\ZK2UTR2K\\Krishnan et al. - 2008 - Who Predicts Better Results from an Online Study.pdf:application/pdf}
}
@article{daugherty_exploring_2008,
title = {Exploring Consumer Motivations for Creating User-Generated Content},
volume = {8},
issn = {null},
doi = {10.1080/15252019.2008.10722139},
abstract = {The advent of Web 2.0 technologies has enabled the efficient creation and distribution of user-generated content ({UGC}), resulting in vast changes in the online media landscape. For instance, the proliferation of {UGC} has made a strong impact on consumers, media suppliers, and marketing professionals while necessitating research in order to understand both the short and long-term implications of this media content. This exploratory study (n = 325) seeks to investigate consumer consumption and creation of {UGC} and the attitudinal factors that contribute to these actions. The data confirm the established relationship between attitude and behavior and indicate attitude serves as a mediating factor between the use and creation of {UGC}. With regard to the creation of {UGC}, the ego-defensive and social functions of attitude were found to have the most explanatory power.},
pages = {16--25},
number = {2},
journaltitle = {Journal of Interactive Advertising},
author = {Daugherty, Terry and Eastin, Matthew S. and Bright, Laura},
date = {2008-03-01},
keywords = {{citeDiss}, temp},
file = {Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\PUSBFA6T\\Daugherty et al. - 2008 - Exploring Consumer Motivations for Creating User-G.pdf:application/pdf;Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\QDFK6447\\Daugherty et al. - 2008 - Exploring Consumer Motivations for Creating User-G.html:text/html}
}
@movie{pugh_star_2009,
title = {Star Wars Uncut: Director's Cut},
url = {www.starwarsuncut.com},
author = {Pugh, Casey},
date = {2009},
keywords = {{citeDiss}, temp}
}
@inproceedings{zhang_enhancing_2009,
location = {New York, {NY}, {USA}},
title = {Enhancing Information Scent: Identifying and Recommending Quality Tags},
isbn = {978-1-60558-500-0},
doi = {10.1145/1531674.1531676},
series = {{GROUP} '09},
shorttitle = {Enhancing Information Scent},
abstract = {We describe a scenario of tag use and an empirical study of tags as socio-cognitive artifacts providing information scent. We articulated a three-step use scenario of tags, and used it to conceptualize tag "quality" as determined by use. We designed and conducted a user study to explore what attributes of tags and taggers predict the user-rated "quality" of tags. We found that frequency best predicted tag quality, while information entropy provided further refinement. We found that people rated our identified quality tags as higher in quality than general tags. But these identified quality tags were not perceived as better than self-generated tags. We derived a regression model for tag quality and discussed implications for social computing.},
pages = {1--10},
booktitle = {Proceedings of the {ACM} 2009 International Conference on Supporting Group Work},
publisher = {{ACM}},
author = {Zhang, Shaoke and Farooq, Umer and Carroll, John M.},
date = {2009},
keywords = {{citeDiss}, quality tags, sense-making, social bookmarking, temp},
file = {Zhang et al_2009_Enhancing Information Scent.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2009\\Zhang et al_2009_Enhancing Information Scent.pdf:application/pdf}
}
@inproceedings{bernstein_crowds_2011,
location = {New York, {NY}, {USA}},
title = {Crowds in two seconds: enabling realtime crowd-powered interfaces},
isbn = {978-1-4503-0716-1},
doi = {10.1145/2047196.2047201},
series = {{UIST} '11},
shorttitle = {Crowds in two seconds},
abstract = {Interactive systems must respond to user input within seconds. Therefore, to create realtime crowd-powered interfaces, we need to dramatically lower crowd latency. In this paper, we introduce the use of synchronous crowds for on-demand, realtime crowdsourcing. With synchronous crowds, systems can dynamically adapt tasks by leveraging the fact that workers are present at the same time. We develop techniques that recruit synchronous crowds in two seconds and use them to execute complex search tasks in ten seconds. The first technique, the retainer model, pays workers a small wage to wait and respond quickly when asked. We offer empirically derived guidelines for a retainer system that is low-cost and produces on-demand crowds in two seconds. Our second technique, rapid refinement, observes early signs of agreement in synchronous crowds and dynamically narrows the search space to focus on promising directions. This approach produces results that, on average, are of more reliable quality and arrive faster than the fastest crowd member working alone. To explore benefits and limitations of these techniques for interaction, we present three applications: Adrenaline, a crowd-powered camera where workers quickly filter a short video down to the best single moment for a photo; and Puppeteer and A{\textbar}B, which examine creative generation tasks, communication with workers, and low-latency voting.},
pages = {33--42},
booktitle = {Proceedings of the 24th annual {ACM} symposium on User interface software and technology},
publisher = {{ACM}},
author = {Bernstein, Michael S. and Brandt, Joel and Miller, Robert C. and Karger, David R.},
date = {2011},
keywords = {{citeDiss}, crowdsourcing, human computation, temp}
}
@inproceedings{tamuz_adaptively_2011,
title = {Adaptively Learning the Crowd Kernel},
shorttitle = {Proc. {ICML} 2011},
booktitle = {Proceedings of the International Conference on Machine Learning},
author = {Tamuz, Omer and Liu, Ce and Belongie, Serge and Shamir, Ohad and Kalai, Adam Tauman},
date = {2011},
keywords = {{citeDiss}, temp},
file = {[PDF] from icml-2011.org:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\PPCZ87MR\\Tamuz et al. - 2011 - Adaptively Learning the Crowd Kernel.pdf:application/pdf}
}
@article{radinsky_learning_2012,
title = {Learning to Predict from Textual Data},
volume = {45},
issn = {1076-9757},
abstract = {Given a current news event, we tackle the problem of generating plausible predictions of future events it might cause. We present a new methodology for modeling and predicting such future news events using machine learning and data mining techniques. Our Pundit algorithm generalizes examples of causality pairs to infer a causality predictor. To obtain precisely labeled causality examples, we mine 150 years of news articles and apply semantic natural language modeling techniques to headlines containing certain predefined causality patterns. For generalization, the model uses a vast number of world knowledge ontologies. Empirical evaluation on real news articles shows that our Pundit algorithm performs as well as non-expert humans.},
pages = {641--684},
number = {1},
journaltitle = {J. Artif. Int. Res.},
author = {Radinsky, Kira and Davidovich, Sagie and Markovitch, Shaul},
date = {2012-09},
keywords = {{citeDiss}, temp}
}
@inproceedings{alonso_are_2013,
location = {New York, {NY}, {USA}},
title = {Are Some Tweets More Interesting Than Others? \#{HardQuestion}},
isbn = {978-1-4503-2570-7},
doi = {10.1145/2528394.2528396},
series = {{HCIR} '13},
shorttitle = {Are Some Tweets More Interesting Than Others?},
abstract = {Twitter has evolved into a significant communication nexus, coupling personal and highly contextual utterances with local news, memes, celebrity gossip, headlines, and other microblogging subgenres. If we take Twitter as a large and varied dynamic collection, how can we predict which tweets will be interesting to a broad audience in advance of lagging social indicators of interest such as retweets? The telegraphic form of tweets, coupled with the subjective notion of interestingness, makes it difficult for human judges to agree on which tweets are indeed interesting. In this paper, we address two questions: Can we develop a reliable strategy that results in high-quality labels for a collection of tweets, and can we use this labeled collection to predict a tweet's interestingness? To answer the first question, we performed a series of studies using crowdsourcing to reach a diverse set of workers who served as a proxy for an audience with variable interests and perspectives. This method allowed us to explore different labeling strategies, including varying the judges, the labels they applied, the datasets, and other aspects of the task. To address the second question, we used crowdsourcing to assemble a set of tweets rated as interesting or not; we scored these tweets using textual and contextual features; and we used these scores as inputs to a binary classifier. We were able to achieve moderate agreement (κ = 0.52) between the best classifier and the human assessments, a figure which reflects the challenges of the judgment task.},
pages = {2:1--2:10},
booktitle = {Proceedings of the Symposium on Human-Computer Interaction and Information Retrieval},
publisher = {{ACM}},
author = {Alonso, Omar and Marshall, Catherine C. and Najork, Marc},
date = {2013},
keywords = {{citeDiss}, crowdsourcing, interestingness, label quality, temp, twitter},
file = {ACM Full Text PDF:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\U8KQZV5M\\Alonso et al. - 2013 - Are Some Tweets More Interesting Than Others #Har.pdf:application/pdf}
}
@inproceedings{kokkalis_emailvalet_2013,
location = {New York, {NY}, {USA}},
title = {{EmailValet}: managing email overload through private, accountable crowdsourcing},
isbn = {978-1-4503-1331-5},
doi = {10.1145/2441776.2441922},
series = {{CSCW} '13},
shorttitle = {{EmailValet}},
abstract = {This paper introduces privacy and accountability techniques for crowd-powered systems. We focus on email task management: tasks are an implicit part of every inbox, but the overwhelming volume of incoming email can bury important requests. We present {EmailValet}, an email client that recruits remote assistants from an expert crowdsourcing marketplace. By annotating each email with its implicit tasks, {EmailValet}'s assistants create a task list that is automatically populated from emails in the user's inbox. The system is an example of a valet approach to crowdsourcing, which aims for parsimony and transparency in access con-trol for the crowd. To maintain privacy, users specify rules that define a sliding-window subset of their inbox that they are willing to share with assistants. To support accountability, {EmailValet} displays the actions that the assistant has taken on each email. In a weeklong field study, participants completed twice as many of their email-based tasks when they had access to crowdsourced assistants, and they became increasingly comfortable sharing their inbox with assistants over time.},
pages = {1291--1300},
booktitle = {Proceedings of the 2013 conference on Computer supported cooperative work},
publisher = {{ACM}},
author = {Kokkalis, Nicolas and Köhn, Thomas and Pfeiffer, Carl and Chornyi, Dima and Bernstein, Michael S. and Klemmer, Scott R.},
date = {2013},
keywords = {access control, {citeDiss}, crowdsourcing, email overload, human assistants, task management, temp}
}
@inproceedings{rzeszotarski_inserting_2013,
title = {Inserting Micro-Breaks into Crowdsourcing Workflows},
rights = {Authors who submit to this conference agree to the following terms: a) \ Authors retain copyright over their work, while allowing the conference to place this unpublished work under a Creative Commons Attribution License , which allows others to freely access, use, and share the work, with an acknowledgement of the work's authorship and its initial presentation at this conference. b) \ Authors are able to waive the terms of the {CC} license and enter into separate, additional contractual arrangements for the non-exclusive distribution and subsequent publication of this work (e.g., publish a revised version in a journal, post it to an institutional repository or publish it in a book), with an acknowledgement of its initial presentation at this conference. c) \ In addition, authors are encouraged to post and share their work online (e.g., in institutional repositories or on their website) at any point before and after the conference.},
abstract = {Participants in human computation workflows may become fatigued or get bored over long, interminable working hours. This leads to a slump of motivation and morale, which in the long run causes reductions in both productivity and work quality. In this paper we propose an initial investigation into possible ways to alleviate worker fatigue and boredom by employing micro-breaks that provide timely relax to workers during long sequences of tasks. We experimentally test micro-breaks on Amazon’s Mechanical Turk, showing that micro-breaks can significantly improve worker retention rate as task batches reach hours in length, and appear to increase overall worker engagement and commitment to their work.},
eventtitle = {First {AAAI} Conference on Human Computation and Crowdsourcing},
booktitle = {First {AAAI} Conference on Human Computation and Crowdsourcing},
author = {Rzeszotarski, Jeffrey M. and Chi, Ed and Paritosh, Praveen and Dai, Peng},
date = {2013-03-11},
langid = {english},
keywords = {{citeDiss}, temp},
file = {Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\PWNUVD5S\\7544.html:text/html}
}
@article{kiritchenko_sentiment_2014,
title = {Sentiment Analysis of Short Informal Texts},
volume = {50},
issn = {1076-9757},
abstract = {We describe a state-of-the-art sentiment analysis system that detects (a) the sentiment of short informal textual messages such as tweets and {SMS} (message-level task) and (b) the sentiment of a word or a phrase within a message (term-level task). The system is based on a supervised statistical text classification approach leveraging a variety of surface-form, semantic, and sentiment features. The sentiment features are primarily derived from novel high-coverage tweet-specific sentiment lexicons. These lexicons are automatically generated from tweets with sentiment-word hashtags and from tweets with emoticons. To adequately capture the sentiment of words in negated contexts, a separate sentiment lexicon is generated for negated words. The system ranked first in the {SemEval}-2013 shared task 'Sentiment Analysis in Twitter' (Task 2), obtaining an F-score of 69.02 in the message-level task and 88.93 in the term-level task. Post-competition improvements boost the performance to an F-score of 70.45 (message-level task) and 89.50 (term-level task). The system also obtains state-of-the-art performance on two additional datasets: the {SemEval}-2013 {SMS} test set and a corpus of movie review excerpts. The ablation experiments demonstrate that the use of the automatically generated lexicons results in performance gains of up to 6.5 absolute percentage points.},
pages = {723--762},
number = {1},
journaltitle = {J. Artif. Int. Res.},
author = {Kiritchenko, Svetlana and Zhu, Xiaodan and Mohammad, Saif M.},
date = {2014-05},
keywords = {{citeDiss}, temp}
}
@inproceedings{organisciak_crowd_2014,
location = {Pittsburgh, {USA}},
title = {A Crowd of Your Own: Crowdsourcing for On-Demand Personalization},
series = {{HCOMP} 2014},
booktitle = {Proceedings of the Second {AAAI} Conference on Human Computation \& Crowdsourcing},
publisher = {{AAAI}},
author = {Organisciak, Peter and Teevan, Jaime and Dumais, Susan T. and Miller, Robert C. and Kalai, Adam Tauman},
date = {2014-11-02},
keywords = {{citeDiss}, temp}
}
@inproceedings{organisciak_matching_2015,
location = {Buenos Aires, Argentina},
title = {Matching and Grokking: Approaches to Personalized Crowdsourcing},
series = {{IJCAI} '15 (Best Papers from Sister Conferences track)},
eventtitle = {International Joint Conferences on Artificial Intelligence},
publisher = {{AAAI}},
author = {Organisciak, Peter and Teevan, Jaime and Dumais, Susan and Miller, Robert C. and Kalai, Adam Tauman},
date = {2015-07},
keywords = {{citeDiss}, temp}
}
@online{chen_mechanical_2012,
title = {Mechanical Turk Best Practices},
url = {Mechanical Turk Best Practices},
type = {Clockwork Raven Wiki},
author = {Chen, Edwin},
date = {2012-10-08},
keywords = {{citeDissProp}}
}
@online{chen_making_2012,
title = {Making the Most of Mechanical Turk: Tips and Best Practices},
url = {http://blog.echen.me/2012/04/25/making-the-most-of-mechanical-turk-tips-and-best-practices/},
type = {Blog},
author = {Chen, Edwin},
date = {2012-04-25},
keywords = {{citeDissProp}}
}
@inproceedings{harris_youre_2011,
title = {You’re hired! an examination of crowdsourcing incentive models in human resource tasks},
eventtitle = {{CSDM}},
pages = {15--18},
booktitle = {Proceedings of the Workshop on Crowdsourcing for Search and Data Mining ({CSDM}) at the Fourth {ACM} International Conference on Web Search and Data Mining ({WSDM})},
author = {Harris, Christopher},
date = {2011},
keywords = {{citeDiss}},
file = {Harris_2011_You’re hired.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\2011\\Harris_2011_You’re hired.pdf:application/pdf}
}
@article{eisenberg_measuring_1988,
title = {Measuring relevance judgments},
volume = {24},
issn = {0306-4573},
doi = {10.1016/0306-4573(88)90042-8},
abstract = {Accurate, reliable measurement of relevance is fundamental to research in information science and to the design, development, and evaluation of information systems. This article describes a study focusing on the measurement of relevance and the application of magnitude estimation, an open-ended scaling technique developed in the field of sensory psychophysics, to the task of measuring relevance judgments. The study found that magnitude estimation is highly appropriate for the measurement of relevance judgments and less influenced by potential biases than commonly used category rating scaling procedures. One biasing factor—a range context effect—was found for both magnitude estimation and category rating scales.},
pages = {373--389},
number = {4},
journaltitle = {Information Processing \& Management},
shortjournal = {Information Processing \& Management},
author = {Eisenberg, Michael B.},
date = {1988},
file = {ScienceDirect Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\2NQ88B5S\\0306457388900428.html:text/html}
}
@inproceedings{urbano_crowdsourcing_2010,
title = {Crowdsourcing preference judgments for evaluation of music similarity tasks},
pages = {9--16},
booktitle = {{ACM} {SIGIR} workshop on crowdsourcing for search evaluation},
author = {Urbano, Julián and Morato, Jorge and Marrero, Mónica and Martín, Diego},
date = {2010},
file = {[PDF] from monica-marrero.com:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\GBD2QXUR\\Urbano et al. - 2010 - Crowdsourcing preference judgments for evaluation .pdf:application/pdf}
}
@article{typke_ground_2005,
title = {A Ground Truth For Half A Million Musical Incipits.},
volume = {3},
pages = {34--38},
number = {1},
journaltitle = {{JDIM}},
author = {Typke, Rainer and den Hoed, Marc and de Nooijer, Justin and Wiering, Frans and Veltkamp, Remco C.},
date = {2005},
file = {[PDF] from computingscience.nl:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\DSMC9DKA\\Typke et al. - 2005 - A Ground Truth For Half A Million Musical Incipits.pdf:application/pdf}
}
@online{hiatt_role_2013,
title = {The Role of Familiarity, Priming and Perception in Similarity Judgments},
author = {Hiatt, Laura and Trafton, J. and Trafton, J. and Trafton, J.},
date = {2013},
file = {The Role of Familiarity, Priming and Perception in Similarity Judgments | Laboratory for Autonomous Systems Research:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\FVZ5BVXV\\role-familiarity-priming-and-perception-similarity-judgments.html:text/html}
}
@article{golder_usage_2006,
title = {Usage patterns of collaborative tagging systems},
volume = {32},
doi = {10.1177/0165551506062337},
pages = {198 --208},
number = {2},
journaltitle = {Journal of Information Science},
author = {Golder, Scott A. and Huberman, Bernardo A.},
date = {2006-04-01},
keywords = {bookmarks, {citeDiss}, collaborative tagging, Del.icio.us, folksonomy, {ICcited}, sharing, social book-marking, social media, sorted, tagging, web},
}
@incollection{downie_music_2010,
title = {The music information retrieval evaluation exchange: Some observations and insights},
pages = {93--115},
booktitle = {Advances in music information retrieval},
publisher = {Springer Berlin / Heidelberg},
author = {Downie, J. Stephen},
date = {2010}
}
@inproceedings{organisciak_iterative_2012,
location = {Washington {DC}, {USA}},
title = {An Iterative Reliability Measure for Semi-anonymous Annotators},
eventtitle = {Joint Conference on Digital Libraries},
author = {Organisciak, Peter},
date = {2012-06},
keywords = {{hcirCITE}}
}
@inproceedings{wang_managing_2011,
location = {Utah},
title = {Managing Crowdsourcing Workers},
abstract = {The emergence of online crowdsourcing services such as Amazon Mechanical Turk, presents us huge opportunities to distribute micro-tasks at an unprecedented rate and scale. Unfortunately, the high verification cost and the unstable employment relationship give rise to opportunistic behaviors of workers, which in turn exposes the requesters to quality risks. Currently, most requesters rely on redundancy to identify the correct answers. However, existing techniques cannot separate the true (unrecoverable) error rates from the (recoverable) biases that some workers exhibit, which would lead to incorrect assessment of worker quality. Furthermore, massive redundancy is expensive, increasing significantly the cost of crowdsourced solutions. In this paper, we present an algorithm that can easily separate the true error rates from the biases. Also, we describe how to seamlessly integrate the existence of “gold” data for learning the quality of workers. Next, we bring up an approach for actively testing worker quality in order to quicky identify spammers or malicious workers. Finally, we present experimental results to demonstrate the performance of our proposed algorithm.},
eventtitle = {Winter Conference on Business Intelligence},
author = {Wang, Jing and Ipeirotis, Panagiotis G., and Provost, Foster},
date = {2011-03},
keywords = {bad workers, {hcirCITE}, {hcirMidtermCITE}, opportunistic workers, reliability, trustworthiness, turk}
}
@inproceedings{organisciak_design_2015,
location = {Newport Beach, {CA}},
title = {Design Facets of Crowdsourcing},
series = {{iConference} '15},
booktitle = {Proceedings of the 2015 {iConference}},
author = {Organisciak, Peter and Twidale, Michael B.},
date = {2015-03-24}
}
@book{mcgonigal_reality_2011,
edition = {Reprint},
title = {Reality Is Broken: Why Games Make Us Better and How They Can Change the World},
isbn = {0-14-312061-1},
shorttitle = {Reality Is Broken},
pagetotal = {416},
publisher = {Penguin Books},
author = {{McGonigal}, Jane},
date = {2011-12-27}
}
@article{swanson_snapshot_2015,
title = {Snapshot Serengeti, high-frequency annotated camera trap images of 40 mammalian species in an African savanna},
volume = {2},
issn = {2052-4463},
doi = {10.1038/sdata.2015.26},
abstract = {Camera traps can be used to address large-scale questions in community ecology by providing systematic data on an array of wide-ranging species. We deployed 225 camera traps across 1,125 km2 in Serengeti National Park, Tanzania, to evaluate spatial and temporal inter-species dynamics. The cameras have operated continuously since 2010 and had accumulated 99,241 camera-trap days and produced 1.2 million sets of pictures by 2013. Members of the general public classified the images via the citizen-science website www.snapshotserengeti.org. Multiple users viewed each image and recorded the species, number of individuals, associated behaviours, and presence of young. Over 28,000 registered users contributed 10.8 million classifications. We applied a simple algorithm to aggregate these individual classifications into a final ‘consensus’ dataset, yielding a final classification for each image and a measure of agreement among individual answers. The consensus classifications and raw imagery provide an unparalleled opportunity to investigate multi-species dynamics in an intact ecosystem and a valuable resource for machine-learning and computer-vision research.},
journaltitle = {Scientific Data},
shortjournal = {Sci Data},
author = {Swanson, Alexandra and Kosmala, Margaret and Lintott, Chris and Simpson, Robert and Smith, Arfon and Packer, Craig},
date = {2015-06-09},
pmid = {26097743},
pmcid = {PMC4460915},
file = {Swanson et al_2015_Snapshot Serengeti, high-frequency annotated camera trap images of 40 mammalian.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Scientific Data2015\\Swanson et al_2015_Snapshot Serengeti, high-frequency annotated camera trap images of 40 mammalian.pdf:application/pdf}
}
@inproceedings{eveleigh_i_2013,
title = {I want to be a captain! i want to be a captain!: gamification in the old weather citizen science project},
shorttitle = {I want to be a captain! i want to be a captain!},
pages = {79--82},
booktitle = {Proceedings of the First International Conference on Gameful Design, Research, and Applications},
publisher = {{ACM}},
author = {Eveleigh, Alexandra and Jennett, Charlene and Lynn, Stuart and Cox, Anna L.},
date = {2013},
file = {Eveleigh et al_2013_I want to be a captain.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2013\\Eveleigh et al_2013_I want to be a captain.pdf:application/pdf;Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\SQAP38A6\\citation.html:text/html}
}
@article{chiesura_introducing_2015,
title = {Introducing {LibCrowds}: a crowdsourcing platform aimed at enhancing access to British Library collections},
shorttitle = {Introducing {LibCrowds}},
author = {Chiesura, Sara and Gallop, Annabel and Mendes, Alex and Mc Gregor, Nora},
date = {2015-06-08},
file = {[HTML] from typepad.co.uk:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\EGNBXDVF\\malay.html:text/html}
}
@inproceedings{resnick_grouplens_1994,
title = {{GroupLens}},
isbn = {0-89791-689-1},
doi = {10.1145/192844.192905},
abstract = {Collaborative filters help people make choices based on the opinions of other people. {GroupLens} is a system for collaborative filtering of netnews, to help people find articles they will like in the huge stream of available articles. News reader clients display predicted scores and make it easy for users to rate articles after they read them. Rating servers, called Better Bit Bureaus, gather and disseminate the ratings. The rating servers predict scores based on the heuristic that people who agreed in the past will probably agree again. Users can protect their privacy by entering ratings under pseudonyms, without reducing the effectiveness of the score prediction. The entire architecture is open: alternative software for news clients and Better Bit Bureaus can be developed independently and can interoperate with the components we have developed.},
eventtitle = {{CSCW} '94},
pages = {175--186},
booktitle = {Proceedings of the 1994 {ACM} conference on Computer supported cooperative work},
publisher = {{ACM} Press},
author = {Resnick, Paul and Iacovou, Neophytos and Suchak, Mitesh and Bergstrom, Peter and Riedl, John},
date = {1994},
keywords = {candidates, Collaborative filtering},
file = {Resnick et al. - 1994 - GroupLens.html:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\PR8WT5E6\\Resnick et al. - 1994 - GroupLens.html:text/html}
}
@online{gardner_nine_2011,
title = {Nine Reasons Women Don't Edit Wikipedia (in their own words)},
abstract = {The New York Times piece on Wikipedia’s gender gap has given rise to dozens of great online conversations about why so few women edit Wikipedia. I've been reading {ALL} of it, because I believe we ne...},
titleaddon = {Sue Gardner's Blog},
author = {Gardner, Sue},
urldate = {2015-08-07},
date = {2011-02-19},
keywords = {{citeDiss}},
file = {Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\WI37G4R3\\nine-reasons-why-women-dont-edit-wikipedia-in-their-own-words.html:text/html}
}
@article{wellman_social_2003,
title = {The Social Affordances of the Internet for Networked Individualism},
volume = {8},
issn = {1083-6101},
doi = {10.1111/j.1083-6101.2003.tb00216.x},
abstract = {We review the evidence from a number of surveys in which our {NetLab} has been involved about the extent to which the Internet is transforming or enhancing community. The studies show that the Internet is used for connectivity locally as well as globally, although the nature of its use varies in different countries. Internet use is adding on to other forms of communication, rather than replacing them. Internet use is reinforcing the pre-existing turn to societies in the developed world that are organized around networked individualism rather than group or local solidarities. The result has important implications for civic involvement.},
pages = {0--0},
number = {3},
journaltitle = {Journal of Computer-Mediated Communication},
author = {Wellman, Barry and Quan-Haase, Anabel and Boase, Jeffrey and Chen, Wenhong and Hampton, Keith and Díaz, Isabel and Miyata, Kakuko},
date = {2003-04-01},
langid = {english},
keywords = {{citeDiss}},
file = {Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\85EQRN7K\\abstract.html:text/html}
}
@article{muchnik_origins_2013,
title = {Origins of power-law degree distribution in the heterogeneity of human activity in social networks},
volume = {3},
rights = {© 2013 Macmillan Publishers Limited. All rights reserved},
doi = {10.1038/srep01783},
abstract = {The probability distribution of number of ties of an individual in a social network follows a scale-free power-law. However, how this distribution arises has not been conclusively demonstrated in direct analyses of people's actions in social networks. Here, we perform a causal inference analysis and find an underlying cause for this phenomenon. Our analysis indicates that heavy-tailed degree distribution is causally determined by similarly skewed distribution of human activity. Specifically, the degree of an individual is entirely random - following a “maximum entropy attachment” model - except for its mean value which depends deterministically on the volume of the users' activity. This relation cannot be explained by interactive models, like preferential attachment, since the observed actions are not likely to be caused by interactions with other people.},
journaltitle = {Scientific Reports},
shortjournal = {Sci. Rep.},
author = {Muchnik, Lev and Pei, Sen and Parra, Lucas C. and Reis, Saulo D. S. and Andrade Jr, José S. and Havlin, Shlomo and Makse, Hernán A.},
date = {2013-05-07},
langid = {english},
keywords = {Applied physics, {citeDiss}, Complex networks}
}
@inbook{lavrakas_intercoder_2008,
location = {Thousand Oaks, {CA}, {USA}},
title = {Intercoder Reliability},
isbn = {978-1-4129-1808-4 978-1-4129-6394-7},
booktitle = {Encyclopedia of Survey Research Methods},
publisher = {{SAGE} Publications, Inc.},
author = {Cho, Young Ik},
bookauthor = {Lavrakas, Paul},
date = {2008},
keywords = {{citeDiss}}
}
@article{kittur_crowdsourcing_2008,
title = {Crowdsourcing for usability: Using micro-task markets for rapid, remote, and low-cost user measurements},
shorttitle = {Crowdsourcing for usability},
journaltitle = {Proc. {CHI} 2008},
author = {Kittur, Aniket and Chi, E. and Suh, Bongwon},
date = {2008},
keywords = {{citeDiss}}
}
@inproceedings{ambati_towards_2011,
title = {Towards Task Recommendation in Micro-Task Markets.},
pages = {1--4},
booktitle = {Human computation},
publisher = {Citeseer},
author = {Ambati, Vamshi and Vogel, Stephan and Carbonell, Jaime G.},
date = {2011},
keywords = {{citeDiss}},
file = {Ambati et al_2011_Towards Task Recommendation in Micro-Task Markets.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Citeseer2011\\Ambati et al_2011_Towards Task Recommendation in Micro-Task Markets.pdf:application/pdf}
}
@misc{_guidelines_2014,
title = {Guidelines for Academic Requesters},
url = {http://wiki.wearedynamo.org/index.php/Guidelines_for_Academic_Requesters},
publisher = {Dynamo Wiki},
date = {2014},
keywords = {{citeDiss}}
}
@inproceedings{sen_quest_2007,
location = {New York, {NY}, {USA}},
title = {The Quest for Quality Tags},
isbn = {978-1-59593-845-9},
doi = {10.1145/1316624.1316678},
series = {{GROUP} '07},
abstract = {Many online communities use tags - community selected words or phrases - to help people find what they desire. The quality of tags varies widely, from tags that capture akey dimension of an entity to those that are profane, useless, or unintelligible. Tagging systems must often select a subset of available tags to display to users due to limited screen space. Because users often spread tags they have seen, selecting good tags not only improves an individual's view of tags, it also encourages them to create better tags in the future. We explore implicit (behavioral) and explicit (rating) mechanisms for determining tag quality. Based on 102,056 tag ratings and survey responses collected from 1,039 users over 100 days, we offer simple suggestions to designers of online communities to improve the quality of tags seen by their users.},
pages = {361--370},
booktitle = {Proceedings of the 2007 International {ACM} Conference on Supporting Group Work},
publisher = {{ACM}},
author = {Sen, Shilad and Harper, F. Maxwell and {LaPitz}, Adam and Riedl, John},
date = {2007},
keywords = {{citeDiss}, moderation, tagging, user interfaces},
file = {Sen et al_2007_The Quest for Quality Tags.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2007\\Sen et al_2007_The Quest for Quality Tags.pdf:application/pdf}
}
@inproceedings{mitra_comparing_2015,
title = {Comparing Person-and Process-centric Strategies for Obtaining Quality Data on Amazon Mechanical Turk},
pages = {1345--1354},
booktitle = {Proceedings of the 33rd Annual {ACM} Conference on Human Factors in Computing Systems},
publisher = {{ACM}},
author = {Mitra, Tanushree and Hutto, C. J. and Gilbert, Eric},
date = {2015},
keywords = {{citeDiss}},
file = {Mitra et al_2015_Comparing Person-and Process-centric Strategies for Obtaining Quality Data on.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\ACM2015\\Mitra et al_2015_Comparing Person-and Process-centric Strategies for Obtaining Quality Data on.pdf:application/pdf}
}
@article{hofmann_latent_2004,
title = {Latent Semantic Models for Collaborative Filtering},
volume = {22},
issn = {1046-8188},
doi = {10.1145/963770.963774},
abstract = {Collaborative filtering aims at learning predictive models of user preferences, interests or behavior from community data, that is, a database of available user preferences. In this article, we describe a new family of model-based algorithms designed for this task. These algorithms rely on a statistical modelling technique that introduces latent class variables in a mixture model setting to discover user communities and prototypical interest profiles. We investigate several variations to deal with discrete and continuous response variables as well as with different objective functions. The main advantages of this technique over standard memory-based methods are higher accuracy, constant time prediction, and an explicit and compact model representation. The latter can also be used to mine for user communitites. The experimental evaluation shows that substantial improvements in accucracy over existing methods and published results can be obtained.},
pages = {89--115},
number = {1},
journaltitle = {{ACM} Transactions on Information Systems},
author = {Hofmann, Thomas},
date = {2004-01},
keywords = {{citeDiss}, {citeDissProp}},
file = {Hofmann - 2004 - Latent Semantic Models for Collaborative Filtering.pdf:C\:\\Users\\Peter\\Dropbox\\papers\\Hofmann - 2004 - Latent Semantic Models for Collaborative Filtering.pdf:application/pdf}
}
@inproceedings{organisciak_improving_2015,
location = {Knoxville, {TN}},
title = {Improving Consistency of Crowdsourced Multimedia Similarity for Evaluation},
series = {{JCDL} '15},
eventtitle = {Joint Conference on Digital Libraries 2015},
publisher = {{ACM}},
author = {Organisciak, Peter and Downie, J. Stephen},
date = {2015-06},
keywords = {{citeDiss}}
}
@inproceedings{lee_survey_2004,
title = {Survey Of Music Information Needs, Uses, And Seeking Behaviours: Preliminary Findings.},
volume = {2004},
shorttitle = {Survey Of Music Information Needs, Uses, And Seeking Behaviours},
pages = {5th},
booktitle = {{ISMIR}},
publisher = {Citeseer},
author = {Lee, Jin Ha and Downie, J. Stephen},
date = {2004},
keywords = {{citeDiss}}
}
@article{polk_rating_2002,
title = {Rating the similarity of simple perceptual stimuli: asymmetries induced by manipulating exposure frequency},
volume = {82},
issn = {0010-0277},
shorttitle = {Rating the similarity of simple perceptual stimuli},
abstract = {When judging the similarity of two stimuli, people's ratings often differ depending on the order in which the comparison is presented (A vs. B or B vs. A). Such directional asymmetries have typically been demonstrated using complex concepts that have a large number of semantic features and a standard explanation is that different sets of features are emphasized depending on the direction of the comparison. In this study, we show that directional asymmetries in the similarity of simple perceptual stimuli can be predictably manipulated merely by presenting each member of a pair with different frequency. Participants rated the similarity of color patches before and after performing an irrelevant training task in which a subset of colors was presented ten times more frequently than others. The similarity ratings after training were significantly more asymmetric than the ratings before training. We discuss the implications of these findings for models of similarity judgment and propose a computationally explicit explanation based on asymmetries in representational stability.},
pages = {B75--88},
number = {3},
journaltitle = {Cognition},
shortjournal = {Cognition},
author = {Polk, Thad A. and Behensky, Charles and Gonzalez, Richard and Smith, Edward E.},
date = {2002-01},
pmid = {11747865},
keywords = {Adult, attention, {citeDiss}, Color Perception, Concept Formation, Discrimination Learning, Female, Humans, Male, Mental Recall, Neural Networks (Computer)}
}
@article{tversky_features_1977,
title = {Features of similarity},
volume = {84},
rights = {(c) 2012 {APA}, all rights reserved},
issn = {1939-1471(Electronic);0033-295X(Print)},
doi = {10.1037/0033-295X.84.4.327},
abstract = {Questions the metric and dimensional assumptions that underlie the geometric representation of similarity on both theoretical and empirical grounds. A new set-theoretical approach to similarity is developed in which objects are represented as collections of features and similarity is described as a feature-matching process. Specifically, a set of qualitative assumptions is shown to imply the contrast model, which expresses the similarity between objects as a linear combination of the measures of their common and distinctive features. Several predictions of the contrast model are tested in studies of similarity with both semantic and perceptual stimuli. The model is used to uncover, analyze, and explain a variety of empirical phenomena such as the role of common and distinctive features, the relations between judgments of similarity and difference, the presence of asymmetric similarities, and the effects of context on judgments of similarity. The contrast model generalizes standard representations of similarity data in terms of clusters and trees. It is also used to analyze the relations of prototypicality and family resemblance. (39 ref)},
pages = {327--352},
number = {4},
journaltitle = {Psychological Review},
author = {Tversky, Amos},
date = {1977},
keywords = {*Cognitive Processes, *Pattern Discrimination, *Stimulus Discrimination, {citeDiss}, Stimulus Similarity}
}
@article{marsden_interrogating_2012,
title = {Interrogating Melodic Similarity: A Definitive Phenomenon or the Product of Interpretation?},
volume = {41},
issn = {0929-8215},
doi = {10.1080/09298215.2012.740051},
shorttitle = {Interrogating Melodic Similarity},
abstract = {The nature of melodic similarity is interrogated through a survey of the different means by which the phenomenon has been studied, examination of methods for measuring melodic similarity, a Monte Carlo analysis of data from the experiment which formed the basis for the ‘ground truth’ used in the {MIREX} 2005 contest on melodic similarity, and examples of interest in the music of Mozart. Melodic similarity has been studied by a number of means, sometimes quite contrasting, which lead to important differences in the light of the finding that similarity is dependent on context. Models of melodic similarity based on reduction show that the existence of multiple possible reductions forms a natural basis for similarity to depend on interpretation. Examination of the {MIREX} 2005 data shows wide variations in subjects' judgements of melodic similarity and some evidence that the perceived similarity between two melodies can be influenced by the presence of a third melody. Examples from Mozart suggest that he deliberately exploited the possibilities inherent in recognizing similarity through different interpretations. It is therefore proposed that similarity be thought of not as a distinct and definite function of two melodies but as something created in the minds of those who hear the melodies.},
pages = {323--335},
number = {4},
journaltitle = {Journal of New Music Research},
author = {Marsden, Alan},
date = {2012-12-01},
keywords = {{citeDiss}},
file = {Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\33XZXZJG\\09298215.2012.html:text/html}
}
@article{katter_influence_1968,
title = {The influence of scale form on relevance judgments},
volume = {4},
issn = {0020-0271},
doi = {10.1016/0020-0271(68)90002-8},
abstract = {This paper reports the results of two studies. The first compared ranking and category rating procedures for measuring relevance of documents to information requirement statements. The comparison measure was number of reversals; the condition where document-requirement pair A is measured as more relevant than pair B by one procedure and as less relevant than pair B by the other. As compared to category rating, ranking produced three times the expected number of reversals. The results are explained in terms of a “cascaded distortion process” that can affect any procedure which arbitrarily restricts distribution shape.
The second study compared the stimulus range and anchoring sensitivities of a nine-point category scale and a magnitude-ratio scale procedure. Results from the category scale were more consistent and more as predicted. Magnitude ratio results were distorted by unrepresentative scale moduli selected by about one-sixth of the judges, a condition which may be correctable. Suggestions for improved anchoring procedures are discussed in light of the findings for the anchoring treatment.},
pages = {1--11},
number = {1},
journaltitle = {Information Storage and Retrieval},
shortjournal = {Information Storage and Retrieval},
author = {Katter, R. V.},
date = {1968-03},
keywords = {{citeDiss}},
file = {ScienceDirect Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\QXMCQ3RA\\0020027168900028.html:text/html}
}
@inproceedings{efron_building_2011,
location = {New Orleans, {USA}},
title = {Building Topic Models in a Federated Digital Library Through Selective Document Exclusion},
series = {{ASIS}\&T '11},
eventtitle = {{ASIS}\&T Annual Meeting},
booktitle = {Proceedings of the American Society for Information Science and Technology},
author = {Efron, Miles and Organisciak, Peter and Fenlon, Katrina},
date = {2011-10},
keywords = {{citeDiss}, {hcirCITE}},
file = {Snapshot:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\7R82INVG\\full.html:text/html}
}
@inproceedings{efron_improving_2012,
location = {New York, {NY}, {USA}},
title = {Improving Retrieval of Short Texts Through Document Expansion},
isbn = {978-1-4503-1472-5},
doi = {10.1145/2348283.2348405},
series = {{SIGIR} '12},
abstract = {Collections containing a large number of short documents are becoming increasingly common. As these collections grow in number and size, providing effective retrieval of brief texts presents a significant research problem. We propose a novel approach to improving information retrieval ({IR}) for short texts based on aggressive document expansion. Starting from the hypothesis that short documents tend to be about a single topic, we submit documents as pseudo-queries and analyze the results to learn about the documents themselves. Document expansion helps in this context because short documents yield little in the way of term frequency information. However, as we show, the proposed technique helps us model not only lexical properties, but also temporal properties of documents. We present experimental results using a corpus of microblog (Twitter) data and a corpus of metadata records from a federated digital library. With respect to established baselines, results of these experiments show that applying our proposed document expansion method yields significant improvements in effectiveness. Specifically, our method improves the lexical representation of documents and the ability to let time influence retrieval.},
pages = {911--920},
booktitle = {Proceedings of the 35th International {ACM} {SIGIR} Conference on Research and Development in Information Retrieval},
publisher = {{ACM}},
author = {Efron, Miles and Organisciak, Peter and Fenlon, Katrina},
date = {2012},
keywords = {{citeDiss}, document expansion, dublin core, {hcirCITE}, {INFORMATION} retrieval, language models, microblogs, temporal {IR}, twitter}
}
@inproceedings{little_turkit_2009,
location = {New York, {NY}, {USA}},
title = {{TurKit}: Tools for Iterative Tasks on Mechanical Turk},
isbn = {978-1-60558-672-4},
doi = {10.1145/1600150.1600159},
series = {{HCOMP} '09},
shorttitle = {{TurKit}},
abstract = {Mechanical Turk ({MTurk}) is an increasingly popular web service for paying people small rewards to do human computation tasks. Current uses of {MTurk} typically post independent parallel tasks. We are exploring an alternative iterative paradigm, in which workers build on or evaluate each other's work. We describe {TurKit}, a new toolkit for deploying iterative tasks to {MTurk}, with a familiar imperative programming paradigm that effectively uses {MTurk} workers as subroutines.},
pages = {29--30},
booktitle = {Proceedings of the {ACM} {SIGKDD} Workshop on Human Computation},
publisher = {{ACM}},
author = {Little, Greg and Chilton, Lydia B. and Goldman, Max and Miller, Robert C.},
date = {2009},
keywords = {{citeDiss}, {citeDissProp}, human computation, mechanical turk, toolkit}
}
@book{simon_participatory_2010,
title = {The participatory museum},
publisher = {Museum 2.0},
author = {Simon, Nina},
date = {2010},
keywords = {{citeDiss}},
file = {[HTML] from google.com:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\HE9HVAW9\\books.html:text/html}
}
@inproceedings{wiggins_goals_2012,
title = {Goals and Tasks: Two Typologies of Citizen Science Projects},
doi = {10.1109/HICSS.2012.295},
shorttitle = {Goals and Tasks},
abstract = {Citizen science is a form of research collaboration involving members of the public in scientific research projects to address real-world problems. Often organized as a virtual collaboration, these projects are a type of open movement, with collective goals addressed through open participation in research tasks. We conducted a survey of citizen science projects to elicit multiple aspects of project design and operation. We then clustered projects based on the tasks performed by participants and on the project's stated goals. The clustering results group projects that show similarities along other dimensions, suggesting useful divisions of the projects.},
eventtitle = {2012 45th Hawaii International Conference on System Science ({HICSS})},
pages = {3426--3435},
booktitle = {2012 45th Hawaii International Conference on System Science ({HICSS})},
author = {Wiggins, A and Crowston, Kevin},
date = {2012-01},
keywords = {Approximation methods, {citeDiss}, Citizen science, citizen science project, Collaboration, Communities, Educational institutions, Electronic mail, groupware, Monitoring, open movement, Production, project design, project operation, real-world problem, research collaboration, scientific information systems, scientific research project, virtual collaboration},
file = {IEEE Xplore Abstract Record:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\NJQZCP74\\Wiggins and Crowston - 2012 - Goals and Tasks Two Typologies of Citizen Science.html:text/html}
}
@article{von_ahn_recaptcha_2008,
title = {recaptcha: Human-based character recognition via web security measures},
volume = {321},
shorttitle = {recaptcha},
pages = {1465--1468},
number = {5895},
journaltitle = {Science},
author = {von Ahn, Luis and Maurer, Benjamin and {McMillen}, Colin and Abraham, David and Blum, Manuel},
date = {2008},
keywords = {{citeDiss}, {citeDissProp}},
file = {[HTML] from sciencemag.org:C\:\\Users\\Peter\\AppData\\Roaming\\Zotero\\Zotero\\Profiles\\zec9madg.default\\zotero\\storage\\NEKH8S8Q\\1465.html:text/html}
}
@article{khatib_algorithm_2011,