Pankaj Gulhane, Rajeev Rastogi, Srinivasan H. Sengamedu, Ashwin Tengli. Exploiting Content Redundancy for Web Information Extraction. PVLDB, 3(1):578-587, 2010. [doi]
% Journal article: PVLDB volume 3, issue 1 (2010). The tags, researchr, cites and
% citedby fields are non-standard export metadata; standard styles ignore them.
@article{GulhaneRST10,
  author    = {Gulhane, Pankaj and Rastogi, Rajeev and Sengamedu, Srinivasan H. and Tengli, Ashwin},
  title     = {Exploiting Content Redundancy for Web Information Extraction},
  journal   = {PVLDB},
  volume    = {3},
  number    = {1},
  pages     = {578--587},
  year      = {2010},
  url       = {http://www.comp.nus.edu.sg/~vldb2010/proceedings/files/papers/R51.pdf},
  tags      = {redundancy},
  researchr = {https://researchr.org/publication/GulhaneRST10},
  cites     = {0},
  citedby   = {0},
}