-
Notifications
You must be signed in to change notification settings - Fork 0
/
references.bib
6404 lines (5488 loc) · 207 KB
/
references.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
%% Created using Papers on Mon, 13 Jun 2016.
%% http://papersapp.com/papers/
@article{Boykov:2001de,
author = {Boykov, Y and Veksler, O and Zabih, R},
title = {{Fast approximate energy minimization via graph cuts}},
journal = {Pattern Analysis and Machine Intelligence, IEEE Transactions on},
year = {2001},
volume = {23},
number = {11},
pages = {1222--1239}
}
@inproceedings{Borst:2003ch,
author = {Borst, C and Fischer, M and Hirzinger, G},
title = {{Grasping the dice by dicing the grasp}},
booktitle = {2003 IEEE/RSJ International Conference on Intelligent Robots and Systems},
year = {2003},
pages = {3692--3697}
}
@article{Thrun:1998ex,
author = {Thrun, Sebastian and Burgard, Wolfram and Fox, Dieter},
title = {{A Probabilistic Approach to Concurrent Mapping and Localization for Mobile Robots}},
journal = {Autonomous Robots},
year = {1998},
volume = {5},
number = {3/4},
pages = {253--271}
}
@inproceedings{Jaakkola00tutorialon,
author = {Jaakkola, Tommi S},
title = {{Tutorial on Variational Approximation Methods}},
booktitle = {In Advanced Mean Field Methods: Theory and Practice},
year = {2000},
pages = {129--159},
publisher = {MIT Press}
}
@article{Pan:2010wx,
author = {Pan, S J and Yang, Q},
title = {{A Survey on Transfer Learning}},
journal = {{\ldots} and Data Engineering},
year = {2010}
}
@article{Tzikas:2008fu,
author = {Tzikas, D G and Likas, A C and Galatsanos, N P},
title = {{The variational approximation for Bayesian inference}},
journal = {Signal Processing Magazine, IEEE},
year = {2008},
volume = {25},
number = {6},
pages = {131--146}
}
@article{Rosales:2010gl,
author = {Rosales, C and Ros, L and Porta, J M and Suarez, R},
title = {{Synthesizing Grasp Configurations with Specified Contact Regions}},
journal = {The International Journal of Robotics Research},
year = {2010},
month = jul
}
@inproceedings{madry2012ICRA_SPME,
author = {Madry, Marianna and Song, Dan and Ek, Carl Henrik and Kragic, Danica},
title = {{''Robot bring me something to drink from": object representation for transferring task specific grasps}},
booktitle = {The ICRA'12 Workshop on Semantic Perception, Mapping and Exploration (SPME)},
year = {2012}
}
@article{Yuruten:2013hr,
author = {Yuruten, O and Sahin, E and Kalkan, S},
title = {{The learning of adjectives and nouns from affordance and appearance features}},
journal = {Adaptive Behavior},
year = {2013},
volume = {21},
number = {6},
pages = {437--451},
month = nov
}
@inproceedings{detry2013ICRA,
author = {Detry, Renaud and Ek, Carl Henrik and Madry, Marianna and Kragic, Danica},
title = {{Compressing Grasping Experience into a Dictionary of Prototypical Grasp-predicting Parts}},
booktitle = {The 5th International Workshop on Human-Friendly Robotics},
year = {2012},
month = oct
}
@article{Oztop:2004ed,
author = {Oztop, Erhan and Bradley, NinaS and Arbib, MichaelA},
title = {{Infant grasp learning: a computational model}},
journal = {Experimental Brain Research},
year = {2004},
volume = {158},
number = {4},
pages = {480--503},
month = jun
}
@inproceedings{madry2012ICRA,
author = {Madry, Marianna and Song, Dan and Kragic, Danica},
title = {{D/3D Object Categorization for Task Based Grasping}},
booktitle = {European Robotics Forum 2011: RGB-D Workshop on 3D Perception in Robotics},
year = {2011},
month = apr,
annote = {extended abstract}
}
@article{Rosch:1976cc,
author = {Rosch, Eleanor and Mervis, Carolyn B and Gray, Wayne D and Johnson, David M and Boyes-Braem, Penny},
title = {{Basic objects in natural categories}},
journal = {Cognitive psychology},
year = {1976},
volume = {8},
number = {3},
pages = {382--439},
month = jul
}
@article{Qian:2012ta,
author = {Qian, X and Tang, Y Yan and Yan, Z and Hang, Kaiyu},
title = {{ISABoost: A weak classifier inner structure adjusting based AdaBoost algorithm---ISABoost based application in scene categorization}},
journal = {Neurocomputing},
year = {2012}
}
@inproceedings{Song:2011cy,
author = {Song, Dan and Ek, Carl Henrik and Huebner, Kai and Kragic, Danica},
title = {{Multivariate discretization for Bayesian Network structure learning in robot grasping}},
booktitle = {2011 IEEE International Conference on Robotics and Automation},
year = {2011},
pages = {1944--1950}
}
@article{Argall:2009hh,
author = {Argall, Brenna D and Chernova, Sonia and Veloso, Manuela and Browning, Brett},
title = {{A survey of robot learning from demonstration}},
journal = {Robotics and Autonomous Systems},
year = {2009},
volume = {57},
number = {5},
pages = {469--483},
month = may
}
@article{Ruhnke:2013tt,
author = {Ruhnke, M and Bo, L and Fox, Dieter and Burgard, Wolfram},
title = {{Compact RGBD Surface Models Based on Sparse Coding}},
year = {2013}
}
@inproceedings{Detry:vc,
author = {Detry, Renaud and Hjelm, Martin and Ek, Carl Henrik and Kragic, Danica},
title = {{Generalizing Task Parameters Through Modularization}},
booktitle = {ICRA Workshop on Autonomous Learning}
}
@article{Borst:2004wf,
author = {Borst, C and Fischer, M and Hirzinger, G},
title = {{Grasp Planning: How to Choose a Suitable Task Wrench Space}},
journal = {Robotics {\&} Automation {\ldots}},
year = {2004}
}
@article{Wang:2012uo,
author = {Wang, Chong and Blei, David M.},
title = {{Variational Inference in Nonconjugate Models}},
journal = {arXiv.org},
year = {2012},
eprint = {1209.4360v4},
eprinttype = {arxiv},
eprintclass = {stat.ML},
month = sep
}
@inproceedings{detry2010c,
author = {Detry, Renaud and Piater, Justus},
title = {{Continuous Surface-point Distributions for 3D Object Pose Estimation and Recognition}},
booktitle = {Asian Conference on Computer Vision},
year = {2010},
pages = {572--585},
annote = {
Basic idea: model the object in 3D by computing a probability distribution acrross it surface. The proability distributions is calculated by using KDE on samples from the object.
}
}
@inproceedings{Griffith:2009cm,
author = {Griffith, S and Sinapov, J and Miller, M and Stoytchev, A},
title = {{Toward interactive learning of object categories by a robot: A case study with container and non-container objects}},
booktitle = {Development and Learning, 2009. ICDL 2009. IEEE 8th International Conference on},
year = {2009},
pages = {1--6},
annote = {<b>Summary:</b>
Problem: To learn a robot from sensory-motor experince what is a container and not a container. And to use the sensory-motor experience to classfiy novel objects to a specific category.
The robot drops a cube into a container that is either up or up-side down and oberseves the outcome. It then tries to push the container and depedning on the co-movement or no co-movement with the cube it can learn a functional representation of the object.
In some sense this is clustering based upon outcome experience rather than then clustering of features; so there is a temporal aspect to it that is interesting.
The not so cool part is that the clustering into the two groups container and not a container is not so convincing, and that the classificiation that they do on novel objects based upon the image features they extracted are kind of riddiciolous.
}
}
@inproceedings{Tsai:2011kd,
author = {Tsai, G and Xu, Changhai and Liu, Jingen and Kuipers, Benjamin J},
title = {{Real-time indoor scene understanding using Bayesian filtering with motion cues}},
booktitle = {Computer Vision (ICCV), 2011 IEEE International Conference on},
year = {2011},
pages = {121--128}
}
@article{Bo:2011ve,
author = {Bo, L and Ren, X and Fox, Dieter},
title = {{Hierarchical matching pursuit for image classification: Architecture and fast algorithms}},
journal = {Advances in Neural Information {\ldots}},
year = {2011}
}
@inproceedings{Singhi:2006jz,
author = {Singhi, Surendra K and Liu, Huan},
title = {{Feature subset selection bias for classification learning}},
booktitle = {ICML '06: Proceedings of the 23rd international conference on Machine learning},
year = {2006},
publisher = { ACM},
month = jun
}
@article{McCarty:2001dr,
author = {McCarty, Michael E and Clifton, Rachel K and Ashmead, Daniel H and Lee, Philip and Goubet, Nathalie},
title = {{How Infants Use Vision for Grasping Objects}},
journal = {Child Development},
year = {2001},
volume = {72},
number = {4},
pages = {973--987},
month = aug
}
@inproceedings{Thrun:2000il,
author = {Thrun, Sebastian and Burgard, Wolfram and Fox, Dieter},
title = {{A real-time algorithm for mobile robot mapping with applications to multi-robot and 3D mapping}},
booktitle = {2000 IEEE International Conference on Robotics and Automation},
year = {2000},
pages = {321--328}
}
@article{Afkham:2008ez,
author = {Afkham, H M and Targhi, A T and Eklundh, J-O and Pronobis, A},
title = {{Joint visual vocabulary for animal classification}},
journal = {International Conference on Pattern Recognition. Proceedings},
year = {2008},
pages = {1--4},
month = dec
}
@inproceedings{Gienger:2008gk,
author = {Gienger, M and Toussaint, M and Goerick, C},
title = {{Task maps in humanoid robot manipulation}},
booktitle = {2008 IEEE/RSJ International Conference on Intelligent Robots and Systems},
year = {2008},
pages = {2758--2764}
}
@article{Widynski:2014dc,
author = {Widynski, Nicolas and Moevus, Antoine and Mignotte, Max},
title = {{Local symmetry detection in natural images using a particle filtering approach.}},
journal = {IEEE transactions on image processing : a publication of the IEEE Signal Processing Society},
year = {2014},
volume = {23},
number = {12},
pages = {5309--5322},
month = dec
}
@book{Hastie:2009wp,
author = {Hastie, Trevor and Tibshirani, Robert and Friedman, Jerome},
title = {{The Elements of Statistical Learning}},
publisher = {Springer},
year = {2009},
series = {Data Mining, Inference, and Prediction, Second Edition},
month = aug,
annote = {Consider minimizing D∗ subject to ||$\beta$|| = 1. Describe this criterion in words. Does it solve the optimal separating hyperplane problem?
}
}
@article{Billard:2006vb,
author = {Billard, A G and Calinon, S and Guenter, F},
title = {{Discriminative and adaptive imitation in uni-manual and bi-manual tasks}},
journal = {Robotics and Autonomous Systems},
year = {2006}
}
@inproceedings{Geiger:2009bc,
author = {Geiger, Andreas and Urtasun, Raquel and Darrell, Trevor J},
title = {{Rank priors for continuous non-linear dimensionality reduction}},
booktitle = {Computer Vision and Pattern Recognition (CVPR), 2009 IEEE Conference on},
year = {2009},
pages = {880--887}
}
@book{Heckerman:2008fh,
author = {Heckerman, David},
editor = {Holmes, Dawn E and Jain, Lakhmi C},
title = {{Studies in Computational Intelligence}},
publisher = {Springer Berlin Heidelberg},
year = {2008},
volume = {156},
series = {Studies in Computational Intelligence},
address = {Berlin, Heidelberg}
}
@article{Gelman:2002wx,
author = {Gelman, Andrew},
title = {{Prior Distribution}},
journal = {Encyclopedia of Environmetrics},
year = {2002},
volume = {3},
pages = {1634--1637},
month = apr
}
@inproceedings{Geiger:2011il,
author = {Geiger, Andreas and Lauer, M and Urtasun, Raquel},
title = {{A generative model for 3D urban scene understanding from movable platforms}},
booktitle = {Computer Vision and Pattern Recognition (CVPR), 2011 IEEE Conference on},
year = {2011},
pages = {1945--1952}
}
@article{Gelman:1996ul,
author = {Gelman, Andrew},
title = {{Bayesian Model-Building By Pure Thought: Some Principles And Examples}},
journal = {Statistica Sinica},
year = {1996},
volume = {6},
pages = {215--232},
month = apr
}
@article{AlexJSmola:2001vr,
author = {Smola, Alexander J and Bartlett, Peter},
title = {{Sparse Greedy Gaussian Process Regression}},
year = {2001}
}
@inproceedings{Delong:2010bk,
author = {Delong, A and Osokin, A and Isack, H N and Boykov, Y},
title = {{Fast approximate energy minimization with label costs}},
booktitle = {Computer Vision and Pattern Recognition (CVPR), 2010 IEEE Conference on},
year = {2010},
pages = {2173--2180}
}
@article{Sutton:2010we,
author = {Sutton, Charles and McCallum, Andrew},
title = {{An Introduction to Conditional Random Fields}},
journal = {arXiv.org},
year = {2010},
eprint = {1011.4088v1},
eprinttype = {arxiv},
eprintclass = {stat.ML},
month = nov
}
@inproceedings{Li:1987gj,
author = {Li, Zexiang and Sastry, S},
title = {{Task oriented optimal grasping by multifingered robot hands}},
booktitle = {1987 IEEE International Conference on Robotics and Automation},
year = {1987},
pages = {389--394}
}
@article{Zhou:2011ts,
author = {Zhou, Yang},
title = {{Structure Learning of Probabilistic Graphical Models: A Comprehensive Survey}},
journal = {arXiv.org},
year = {2011},
eprint = {1111.6925v1},
eprinttype = {arxiv},
eprintclass = {stat.ML},
month = nov,
annote = {survey on structure learning}
}
@inproceedings{Stober:2011iv,
author = {Stober, Jeremy and Miikkulainen, Risto and Kuipers, Benjamin J},
title = {{Learning geometry from sensorimotor experience}},
booktitle = {2011 IEEE International Conference on Development and Learning},
year = {2011},
pages = {1--6},
publisher = {IEEE}
}
@article{Sharan:2013cn,
author = {Sharan, Lavanya and Liu, Ce and Rosenholtz, Ruth and Adelson, Edward H},
title = {{Recognizing Materials Using Perceptually Inspired Features}},
journal = {International Journal of Computer Vision},
year = {2013},
volume = {103},
number = {3},
pages = {348--371},
month = feb
}
@article{Argyros:2006in,
author = {Argyros, Antonis A and Lourakis, Manolis I A},
title = {{Vision-Based Interpretation of Hand Gestures for Remote Control of a Computer Mouse}},
journal = {Computer Vision in Human-Computer Interaction},
year = {2006},
volume = {3979},
number = {Chapter 5},
pages = {40--51},
annote = {Thoughts: Where is the line between hardware accelerated research and common simple hardware using algorithmic focused acceleration?
Review:
This paper developes a method for gesture interaction with a mouse / point{\&}amp;click GUI. They hardware used is a simple common webcam on a ordinary computer thus no extra or advanced hardware is used i.e. things lie in the algorithm rather than in the hardware. There are two systems one in 2D and one 3D. Pretty boring.
}
}
@article{Zhang:2004ft,
author = {Zhang, Jianwei and R{\"o}ssler, Bernd},
title = {{Self-valuing learning and generalization with application in visually guided grasping of complex objects}},
journal = {Robotics and Autonomous Systems},
year = {2004},
volume = {47},
number = {2-3},
pages = {117--127},
month = jun
}
@article{Getoor:2007vs,
author = {Getoor, L and Taskar, B},
title = {{Introduction to Statistical Relational Learning - Lise Getoor - Google Books}},
year = {2007}
}
@article{Rothrock:vt,
author = {Rothrock, B and Park, S and Zhu, S C},
title = {{Integrating Grammar and Segmentation for Human Pose Estimation}},
journal = {cs.ucla.edu
}
}
@inproceedings{Wohlkinger:2011da,
author = {Wohlkinger, W and Vincze, M},
title = {{Ensemble of shape functions for 3D object classification}},
booktitle = {Robotics and Biomimetics (ROBIO), 2011 IEEE International Conference on},
year = {2011},
pages = {2987--2992}
}
@inproceedings{Bitzer:2009hn,
author = {Bitzer, Sebastian and Vijayakumar, Sethu},
title = {{Latent Spaces for Dynamic Movement Primitives}},
booktitle = {2009 IEEE-RAS International Conference on Humanoid Robots (Humanoids)},
year = {2009},
pages = {574--581},
publisher = {IEEE}
}
@article{Balasubramanian:2012hb,
author = {Balasubramanian, R and Xu, Ling and Brook, P D and Smith, J R and Matsuoka, Y},
title = {{Physical Human Interactive Guidance: Identifying Grasping Principles From Human-Planned Grasps}},
journal = {Robotics, IEEE Transactions on},
year = {2012},
volume = {28},
number = {4},
pages = {899--910}
}
@inproceedings{Thrun:1999eu,
author = {Thrun, Sebastian and Bennewitz, M and Burgard, Wolfram and Cremers, A B and Dellaert, F and Fox, Dieter and Hahnel, D and Rosenberg, C and Roy, N and Schulte, J and Schulz, D},
title = {{MINERVA: a second-generation museum tour-guide robot}},
booktitle = {1999 IEEE International Conference on Robotics and Automation},
year = {1999},
pages = {1999--2005}
}
@article{Zhou:2014ta,
author = {Zhou, Bolei and Khosla, Aditya and Lapedriza, Agata and Oliva, Aude and Torralba, Antonio},
title = {{Object Detectors Emerge in Deep Scene CNNs}},
journal = {arXiv.org},
year = {2014},
month = dec
}
@article{Neal:2003tm,
author = {Neal, R M},
title = {{Density modeling and clustering using Dirichlet diffusion trees}},
journal = {Bayesian Statistics},
year = {2003}
}
@article{Schenck:2013ts,
author = {Schenck, C and Sinapov, J and Staley, K},
title = {{Grounded Object Individuation
by a Humanoid Robot}},
journal = {engineering.iastate.edu
},
year = {2013},
month = nov
}
@article{James:1997uh,
author = {James, G and Hastie, T},
title = {{Generalizations of the Bias Variance Decomposition for Prediction Error}},
journal = {Dept Statistics},
year = {1997}
}
@article{Kiros:2014wb,
author = {Kiros, Ryan and Salakhutdinov, Ruslan and Zemel, Richard S},
title = {{Unifying Visual-Semantic Embeddings with Multimodal Neural Language Models}},
journal = {arXiv.org},
year = {2014},
eprint = {1411.2539v1},
eprinttype = {arxiv},
eprintclass = {cs.LG},
month = nov,
annote = {13 pages. NIPS 2014 deep learning workshop}
}
@article{Zabulis:2009tz,
author = {Zabulis, X and Baltzakis, HG and Argyros, Antonis A},
title = {{Vision-based hand gesture recognition for human-computer interaction}},
journal = {The Universal Access Handbook},
year = {2009},
annote = {<b>Some thoughts</b>
Detection is separate from learning and understanding gestures etc. Since all we have to know is how a hand looks like in order to detect it.
Learning and understanding must be put in the context of previously aquired knowledge or combinations of such.
Gestures understanding should be correlated with facial expressions and body poses. Body language. Seems that no one has added this approach from what I have read so far. Imagine having an paralell HMM for facial expressions and pose. Also how about the Tobii eye detecion this is also very related to some gestures like pointing at objects, thinking and showing emotions.
<b>Review</b>
An overview of hand/gesture recognition. The authors identify three building blocks of hand gesture inference: detection, tracking and recognition.
<b>Detection</b> consists of the detection of hands and the segementation of the image to understand the context and remove irrelevant data. There are several features that are used in the detection stage.
- <b>Skin color</b>; which is problematic since there is a lot of variance of the skin color in human beings and there is also lot of different lightning conditions adding up to the ambiguity.
- <b>Shape</b>: Edge detection to find the hands. Often combined with color since there is a lot of ambiguity and occlusion. To deal with the clutter some people have used particle filters. There has also been some research into morphology however it seems kind of rudimentary. I am sure something could be done to enhance the morphology approach.
- <b>Pixel values</b>: the ordinary template matching and boosting approach.
- <b>Motion</b>: seems like this feature is a bit unused except for the motion residue idea that hands move more than other objects in the scene. I guess if one wants to detect the hands one starts at frame 1 and then move on to the next frame. So real time seems a bit difficult maybe more applicable when analyzing a sequence.
<b>Tracking</b>
The tracking part deals with keeping track of where the hands go. Basically so that one does not have to do the detection over again.
- <b>Templates</b>: basically once the hands have been detected that part is used as template for detecting the hand in the next frame. There are also contour blob templates that are deformed to fit the hand contour in the next frame. Good approach but very sensitive to clutter.
- <b>Optimal estimation techniques</b>: Kalman filtering framework. Hard to understand since I have forgotten what Kalman filtering is...
- <b>Mean shift algorithm</b>: should investigate how it works.
- <b>Particle filtering</b> {\&}amp; condensation algorithm to be investigated.
<b>Recognition</b>
Interpreting the semantics that the hand(s) location, posture, or gesture conveys. The paper defines two categories: 1) interpretation of control applications such as drawing lines etc. A bit unclear definition actually. What this should mean is actually action understanding. Right? Or would this get filed under 2 as well. Very ambigious and unclear. 2) Interpretatioon of gestures, postures, signs etc. Then they talk about how this phase is context driven and how HMMs are a good framework for the understanding. Some approaches are outlined below.
- <b>Template matching</b>: Same procedure as with facerecognition. The only difference here is that here we are essentially dealing with a 360 degree object but for faces there is only about 180 which certainly makes recognition a bit harder. A lot of people seems to be doing multiple views templates plus a coordination with previous frames matched templates. There is also some kind histogram idea which doesn't seem to work out due to the ambigiuous nature of the problem.
- <b>PCA</b>: Seems to be the ordinary reduce dimensions and then compare against training data procedure. Not fantastically interesting.
- <b>Boosting</b>: Very vague description in this paragraph. Seems to describe a boosting approach to clustering or using hiearchial trees. Again problems with ambigiuity and lightning conditions.
-<b> Contour and silhouette matching</b>: Sort of a repitition of the detection chapter. Very much based on template matching again. Biggest problem is again ambiguity and clutter. There seems to be an idea to use the matching to restrict the area where the recognition is using contours and then use the silhouette to match. Again the approach is the obvious combine features...
- <b>Model-based recognition methods</b>. Starts out with some obvious statements such that the classification success depends on choosing the right features. Who would have known...They also cite some paper that has evaluated features and figured out that velocity features are...}
}
@inproceedings{Rother:2002wn,
author = {Rother, Carsten},
title = {{A new approach to vanishing point detection in architectural environments}},
booktitle = {Image and Vision Computing},
year = {2002},
pages = {647--655},
organization = {Royal Inst Technol, KTH, Computat Vis {\&} Act Percept Lab, CVAP, S-10044 Stockholm, Sweden}
}
@article{Donahue:2014ut,
author = {Donahue, Jeff and Hendricks, Lisa Anne and Guadarrama, Sergio and Rohrbach, Marcus and Venugopalan, Subhashini and Saenko, Kate and Darrell, Trevor J},
title = {{Long-term Recurrent Convolutional Networks for Visual Recognition and Description}},
journal = {arXiv.org},
year = {2014},
eprint = {1411.4389v3},
eprinttype = {arxiv},
eprintclass = {cs.CV},
month = nov
}
@inproceedings{Hu:2014eu,
author = {Hu, Junlin and Lu, Jiwen and Tan, Yap-Peng},
title = {{Discriminative Deep Metric Learning for Face Verification in the Wild}},
booktitle = {Computer Vision and Pattern Recognition (CVPR), 2014 IEEE Conference on},
year = {2014},
pages = {1875--1882}
}
@article{Provost:2001tu,
author = {Provost, J and Beeson, P and Kuipers, Benjamin J},
title = {{Toward learning the causal layer of the spatial semantic hierarchy using SOMs}},
journal = {{\ldots} Symposium Workshop on Learning {\ldots}},
year = {2001},
annote = {Summary:
Deals with SSH abstraction. Especiially the SSH causal layer. The causal layer deals with sensor views and control actions, and how they affect each other. They use a SOM(Self-organizing Maps) for representing the SSH view set. This fits in with modelling everything as an abstract graph.
They have some good points in the SSH Causal Layer chapter of qualities of how to handle sensory input.
First they define a triple of edges {\&}lt;V,A,V'{\&}gt; such that action A taken under view V indicates V' will happen.
They state that a robot must be able to recognize its current sensor input as one of its set of known views. This means that views must be clustered or at least be discriminated but this is too hard given the noisy input. Therefor they choose to formulate the problem as maximization of the predictive accurace of the {\&}lt;V,A,V'{\&}gt; relations, i.e., the confidence it will see the view V' after taking action A in view V.
Take home message seems to be to reformulate the recognition problem as a relation maximization problem since then one does not have to deal with the infinite space of possible noisy inputs.
<b>Relation to my work:</b> possibly how we can formulate the problem as relational problem rather than view causality learning problem. <b>This thought could be expanded upon.</b>
}
}
@inproceedings{Dindo:2010fr,
author = {Dindo, H and Zambuto, D},
title = {{A probabilistic approach to learning a visually grounded language model through human-robot interaction}},
booktitle = {2010 IEEE/RSJ International Conference on Intelligent Robots and Systems},
year = {2010},
pages = {790--796}
}
@article{Hendrich:2014tz,
author = {Hendrich, N and Bernardino, A},
title = {{Affordance-Based Grasp Planning for Anthropomorphic Hands from Human Demonstration - Springer}},
journal = {ROBOT2013: First Iberian Robotics {\ldots}},
year = {2014}
}
@article{Thrun:2000jv,
author = {Thrun, Sebastian},
title = {{Probabilistic Algorithms and the Interactive Museum Tour-Guide Robot Minerva}},
journal = {The International Journal of Robotics Research},
year = {2000},
volume = {19},
number = {11},
pages = {972--999},
month = nov
}
@inproceedings{Steder:2011bm,
author = {Steder, B and Rusu, R B and Konolige, K and Burgard, Wolfram},
title = {{Point feature extraction on 3D range scans taking into account object boundaries}},
booktitle = {2011 IEEE International Conference on Robotics and Automation},
year = {2011},
pages = {2601--2608}
}
@article{Jaakkola:pDo29F5A,
author = {Jaakkola, Tommi S},
title = {{Jaakkola NIPS 2000 Tutorial}}
}
@inproceedings{Sahbani:2009hd,
author = {Sahbani, Anis and El-Khoury, Sahar},
title = {{A hybrid approach for grasping 3D objects}},
booktitle = {2009 IEEE/RSJ International Conference on Intelligent Robots and Systems},
year = {2009},
pages = {1272--1277},
annote = {
<b>Summary</b>
Segement perfect 3D object models using a segmentation algorithm based upon Gaussian curvature and concaveness. An object is represented using superquadratics. The segementation is such that 7 differerent superquadratics are used for each object.
They then label a superquadratic for each object as the graspable part. They train a Neural Network on the labeled data.
To generate a grasps they do anlytical computations on the detected graspable part. The analytical parts are a force-closure test and a handkinematics test.
No real data is tested. Paper was before Kinect came out.
}
}
@article{Lazebnik:2005he,
author = {Lazebnik, S and Schmid, C and Ponce, J},
title = {{A sparse texture representation using local affine regions}},
journal = {Pattern Analysis and Machine Intelligence, IEEE Transactions on},
year = {2005},
volume = {27},
number = {8},
pages = {1265--1278}
}
@inproceedings{Claassens:2012kh,
author = {Claassens, J and Demiris, Y},
title = {{Exploiting affordance symmetries for task reproduction planning}},
booktitle = {Humanoid Robots (Humanoids), 2012 12th IEEE-RAS International Conference on},
year = {2012},
pages = {653--659}
}
@inproceedings{Kroemer:2012hi,
author = {Kroemer, O and Ugur, E and Oztop, E and Peters, J},
title = {{A kernel-based approach to direct action perception}},
booktitle = {2012 IEEE International Conference on Robotics and Automation},
year = {2012},
pages = {2605--2610}
}
@article{Kohli:2008wx,
author = {Kohli, Pushmeet and Rihan, J and Bray, M and Torr, PHS},
title = {{Simultaneous Segmentation and Pose Estimation of Humans Using Dynamic Graph Cuts - Springer}},
journal = {International Journal of Computer {\ldots}},
year = {2008}
}
@article{Remolina:2004km,
author = {Remolina, Emilio and Kuipers, Benjamin J},
title = {{Towards a general theory of topological maps}},
journal = {Artificial Intelligence Review},
year = {2004},
volume = {152},
number = {1},
pages = {47--104},
month = jan,
annote = {<b>Summary:</b> Too much toplogical map and logic stuff to be worth reading. Doubtful if it contains much information.}
}
@inproceedings{Kazemi:2014he,
author = {Kazemi, Vahid and Sullivan, Josephine},
title = {{One Millisecond Face Alignment with an Ensemble of Regression Trees}},
booktitle = {Computer Vision and Pattern Recognition (CVPR), 2014 IEEE Conference on},
year = {2014},
pages = {1867--1874}
}
@article{Shlens:2014vi,
author = {Shlens, Jonathon},
title = {{A Tutorial on Principal Component Analysis}},
journal = {arXiv.org},
year = {2014},
month = apr
}
@inproceedings{Xue:2009vx,
author = {Xue, Zhixing and Kasper, A and Zoellner, J M and Dillmann, R},
title = {{An automatic grasp planning system for service robots}},
booktitle = {Advanced Robotics, 2009. ICAR 2009. International Conference on},
year = {2009},
pages = {1--6}
}
@inproceedings{Claassens:2011gp,
author = {Claassens, J and Demiris, Y},
title = {{Generalising human demonstration data by identifying affordance symmetries in object interaction trajectories}},
booktitle = {2011 IEEE/RSJ International Conference on Intelligent Robots and Systems},
year = {2011},
pages = {1980--1985}
}
@article{Ginestet:2010dd,
author = {Ginestet, Cedric},
title = {{Introduction to Statistical Relational Learning}},
journal = {Journal of the Royal Statistical Society: Series A (Statistics in Society)},
year = {2010},
volume = {173},
number = {4},
pages = {934--935},
month = sep
}
@article{Biederman:1987bx,
author = {Biederman, Irving},
title = {{Recognition-by-components: A theory of human image understanding.}},
journal = {Psychological review},
year = {1987},
volume = {94},
number = {2},
pages = {115--117}
}
@article{Cheng:2001kp,
author = {Cheng, H D and Jiang, X H and Sun, Y and Wang, Jingli},
title = {{Color image segmentation: advances and prospects}},
journal = {Pattern Recognition},
year = {2001},
volume = {34},
number = {12},
pages = {2259--2281},
month = dec
}
@article{He:2015vx,
author = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
title = {{Delving Deep into Rectifiers: Surpassing Human-Level Performance on ImageNet Classification}},
journal = {arXiv.org},
year = {2015},
eprint = {1502.01852v1},
eprinttype = {arxiv},
eprintclass = {cs.CV},
month = feb
}
@article{Hastie:2000up,
author = {Hastie, T and Tibshirani, R and Eisen, M B and Alizadeh, A},
title = {{Gene shaving'as a method for identifying distinct sets of genes with similar expression patterns}},
journal = {Genome {\ldots}},
year = {2000}
}
@article{Torralba:2003im,
author = {Torralba, Antonio},
title = {{Contextual Priming for Object Detection - Springer}},
journal = {International Journal of Computer Vision},
year = {2003},
volume = {53},
number = {2},
pages = {169--191}
}
@article{Kruger:2011bj,
author = {Kr{\"u}ger, Norbert and Geib, Christopher and Piater, Justus and Petrick, Ronald and Steedman, Mark and W{\"o}rg{\"o}tter, Florentin and Ude, Ale{\v s} and Asfour, Tamim and Kraft, Dirk and Omr{\v c}en, Damir and Agostini, Alejandro and Dillmann, R{\"u}diger},
title = {{Object--Action Complexes: Grounded abstractions of sensory--motor processes}},
journal = {Robotics and Autonomous Systems},
year = {2011},
volume = {59},
number = {10},
pages = {740--757},
month = oct
}
@article{Tsai:uy,
author = {Tsai, G and Kuipers, Benjamin J},
title = {{Focusing Attention on Visual Features that Matter}},
journal = {eecs.umich.edu
}
}
@article{Chopra:2005jh,
author = {Chopra, Sumit and Hadsell, Raia and LeCun, Yann},
title = {{Learning a Similarity Metric Discriminatively, with Application to Face Verification.}},
journal = {CVPR},
year = {2005},
pages = {539--546}
}
@article{QuinoneroCandela:2005wp,
author = {Qui{\~n}onero-Candela, Joaquin and Rasmussen, Carl Edward},
title = {{A unifying view of sparse approximate Gaussian process regression}},
journal = {Journal of Machine Learning Research},
year = {2005},
volume = {6},
pages = {1939--1959}
}
@book{Bishop:2006ui,
author = {Bishop, Christopher M},
title = {{Pattern Recognition and Machine Learning}},
publisher = {Springer-Verlag New York, Inc.},
year = {2006}
}
@book{MacKay:b7_kxpTs,
author = {MacKay, David},
title = {{Information Theory, Inference, and Learning Algorithms}}
}
@inproceedings{Hendrich:2010hx,
author = {Hendrich, N and Klimentjew, D and Zhang, Jianwei},
title = {{Multi-sensor based segmentation of human manipulation tasks}},
booktitle = {Multisensor Fusion and Integration for Intelligent Systems (MFI), 2010 IEEE Conference on},
year = {2010},
pages = {223--229}
}
@article{Bernardo:2008tm,
author = {Bernardo, J M and Bayarri, M J and Berger, J O and Dawid, A P},
title = {{Density Modeling and Clustering Using Dirichlet Diffusion Trees}},
year = {2008}
}
@book{Laub:2005wt,
author = {Laub, Alan J},
title = {{Matrix Analysis for Scientists and Engineers}},
publisher = {Siam},
year = {2005}
}
@article{Csato:2002tz,
author = {Csat{\'o}, Lehel and Opper, Manfred},
title = {{Sparse on-line Gaussian processes}},
journal = {Neural Computation},
year = {2002},
volume = {14},
number = {3},
month = mar
}
@article{Welch:nModKeqF,
author = {Welch, Greg and Bishop, Gary},
title = {{An Introduction to the Kalman Filter}}
}
@article{Fox:1997ed,
author = {Fox, Dieter and Burgard, Wolfram and Thrun, Sebastian},
title = {{The dynamic window approach to collision avoidance}},
journal = {IEEE Robotics {\&} Automation Magazine},
year = {1997},
volume = {4},
number = {1},
pages = {23--33},
month = mar
}
@article{Ekvall:2005ue,
author = {Ekvall, S and Kragic, Danica},
title = {{Grasp Recognition for Programming by Demonstration}},
journal = {{\ldots} },
year = {2005}
}
@article{Ohagan:1994tw,
author = {O'hagan, Anthony and VEENSTRA, RH and Vanbatenburg and Pc and Pc},
title = {{Bayesian Discovery Sampling in Financial Auditing - a Hierarchical Prior Model for Substantive Test Sample Sizes}},
journal = {Statistician},
year = {1994},
volume = {43},
number = {1},
pages = {99--110}
}
@proceedings{Tighe:y1TUmcTG,
title = {{Finding Things: Image Parsing with Regions and Per-Exemplar Detectors}}
}
@article{Sahin:2007gr,
author = {Sahin, E and Cakmak, M and Dogar, M R and Ugur, E and Ucoluk, G},
title = {{To Afford or Not to Afford: A New Formalization of Affordances Toward Affordance-Based Robot Control}},
journal = {Adaptive Behavior},
year = {2007},
volume = {15},
number = {4},
pages = {447--472},
month = dec
}
@inproceedings{BarckHolst:2009uy,
author = {Barck-Holst, C and Ralph, M and Holmar, F and Kragic, Danica},
title = {{Learning grasping affordance using probabilistic and ontological approaches}},
booktitle = {Advanced Robotics, 2009. ICAR 2009. International Conference on},
year = {2009},
pages = {1--6}
}
@article{Tsai:2012vk,
author = {Tsai, G and Kuipers, Benjamin J},
title = {{Dynamic visual understanding of the local environment for an indoor navigating robot}},
journal = {Intelligent Robots and Systems (IROS)},
year = {2012}
}
@inproceedings{Detry:2012bp,
author = {Detry, Renaud and Ek, Carl Henrik and Madry, Marianna and Piater, Justus and Kragic, Danica},
title = {{Generalizing grasps across partly similar objects}},
booktitle = {2012 IEEE International Conference on Robotics and Automation},
year = {2012},
pages = {3791--3797},
publisher = {IEEE}
}
@techreport{Haines:EPp9vr3r,
author = {Haines, Tom},
title = {{Gaussian Conjugate Prior Cheat Sheet}}
}
@techreport{Schon:xcYovD6r,
author = {Sch{\"o}n, Thomas and Lindsten, Fredrik},
title = {{Manipulating the Multivariate Gaussian Density}}
}
@article{Ciocarlie:2009tn,
author = {Ciocarlie, Matei T and Allen, Peter K},
title = {{Hand Posture Subspaces for Dexterous Robotic Grasping}},
journal = {The International Journal of Robotics Research},
year = {2009},