%Aigaion2 BibTeX export from Idiap Publications %Thursday 21 November 2024 12:54:16 PM @INPROCEEDINGS{chen-icpr02, author = {Chen, Datong and Odobez, Jean-Marc and Bourlard, Herv{\'{e}}}, projects = {Idiap}, month = {10}, title = {{T}ext {S}egmentation and {R}ecognition in {C}omplex {B}ackground {B}ased on {M}arkov {R}andom {F}ield}, booktitle = {Int. Conf. Pattern Recognition 2002}, year = {2002}, institution = {IDIAP}, address = {Quebec city, Canada}, crossref = {chen-0217}, abstract = {In this paper we propose a method to segment and recognize text embedded in video and images. We modelize the gray level distribution in the text images as mixture of gaussians, and then assign each pixel to one of the gaussian layer. The assignment is based on prior of the contextual information, which is modeled by a Markov random field (MRF) with online estimated coefficients. Each layer is then processed through a connected component analysis module and forwarded to the OCR system as one segmentation hypothesis. By varying the number of gaussians, multiple hypotheses are provided to an OCR system and the final result is selected from the set of outputs, leading to an improvement of the system's performances.}, pdf = {https://publications.idiap.ch/attachments/reports/2002/rr-02-17.pdf}, postscript = {ftp://ftp.idiap.ch/pub/reports/2002/rr-02-17.ps.gz}, ipdmembership={vision}, } crossreferenced publications: @TECHREPORT{chen-0217, author = {Chen, Datong and Odobez, Jean-Marc and Bourlard, Herv{\'{e}}}, projects = {Idiap}, month = {4}, title = {{T}ext {S}egmentation and {R}ecognition in {C}omplex {B}ackground Based on Markov Random Field}, type = {Idiap-RR}, booktitle = {Int. Conf. Pattern Recognition 2002}, number = {Idiap-RR-17-2002}, year = {2002}, institution = {IDIAP}, note = {Published in Proceedings of the Int. Conf. Pattern Recognition 2002}, abstract = {In this paper we propose a method to segment and recognize text embedded in video and images. We modelize the gray level distribution in the text images as mixture of gaussians, and then assign each pixel to one of the gaussian layer. The assignment is based on prior of the contextual information, which is modeled by a Markov random field (MRF) with online estimated coefficients. Each layer is then processed through a connected component analysis module and forwarded to the OCR system as one segmentation hypothesis. By varying the number of gaussians, multiple hypotheses are provided to an OCR system and the final result is selected from the set of outputs, leading to an improvement of the system's performances.}, pdf = {https://publications.idiap.ch/attachments/reports/2002/rr-02-17.pdf}, postscript = {ftp://ftp.idiap.ch/pub/reports/2002/rr-02-17.ps.gz}, ipdmembership={vision}, }