% Aigaion2 BibTeX export from Idiap Publications
% Friday 11 October 2024 01:51:16 AM

% Conference paper (IEEE International Conference on Image Processing, 2002).
% The link to the technical report below is stored in `xref`, not `crossref`:
% `crossref` copies every field the child lacks from the parent, so this entry
% would otherwise pick up the report's `type`, `number` and `institution`.
% Fields such as `projects`, `pdf`, `postscript` and `ipdmembership` are
% exporter-specific and are not part of the standard BibTeX field set.
@inproceedings{gatica02a-conf,
  author        = {Gatica-Perez, Daniel and Sun, Ming-Ting and Loui, Alexander},
  projects      = {Idiap},
  title         = {Probabilistic Home Video Structuring: Feature Selection and Performance Evaluation},
  booktitle     = {IEEE International Conference on Image Processing},
  year          = {2002},
  xref          = {gatica02a},
  abstract      = {We recently proposed a method to find cluster structure in home videos based on statistical models of visual and temporal features of video segments and sequential binary Bayesian classification. In this paper, we present analysis and improved results on two key issues: feature selection and performance evaluation, using a ten-hour database (30 video clips, 1,075,000 frames). From multiple features and similarity measures, visual features are selected in order to minimize the empirical probability of misclassification. Temporal features are chosen to reflect the patterns existing in both shot and cluster duration and adjacency. Finally, we describe a detailed performance evaluation procedure that includes cluster detection, individual shot-cluster labeling, and prior selection.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2002/rr02-11.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2002/rr02-11.ps.gz},
  ipdmembership = {vision},
}

% Cross-referenced publications:

% Idiap research report (Idiap-RR-11-2002) carrying the same title, authors
% and abstract as the conference entry above.
@techreport{gatica02a,
  author        = {Gatica-Perez, Daniel and Sun, Ming-Ting and Loui, Alexander},
  projects      = {Idiap},
  title         = {Probabilistic Home Video Structuring: Feature Selection and Performance Evaluation},
  type          = {Idiap-RR},
  number        = {Idiap-RR-11-2002},
  year          = {2002},
  institution   = {IDIAP},
  abstract      = {We recently proposed a method to find cluster structure in home videos based on statistical models of visual and temporal features of video segments and sequential binary Bayesian classification. In this paper, we present analysis and improved results on two key issues: feature selection and performance evaluation, using a ten-hour database (30 video clips, 1,075,000 frames). From multiple features and similarity measures, visual features are selected in order to minimize the empirical probability of misclassification. Temporal features are chosen to reflect the patterns existing in both shot and cluster duration and adjacency. Finally, we describe a detailed performance evaluation procedure that includes cluster detection, individual shot-cluster labeling, and prior selection.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2002/rr02-11.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2002/rr02-11.ps.gz},
  ipdmembership = {vision},
}