URL normalization for de-duplication of web pages

Amit Agarwal, Hema Swetha Koppula, Krishna P. Leela, Krishna Prasad Chitrapura, Sachin Garg, Pavan Kumar GM, Chittaranjan Haty, Anirban Roy, Amit Sasturkar. URL normalization for de-duplication of web pages. In David Wai-Lok Cheung, Il-Yeol Song, Wesley W. Chu, Xiaohua Hu, Jimmy J. Lin, editors, Proceedings of the 18th ACM Conference on Information and Knowledge Management, CIKM 2009, Hong Kong, China, November 2-6, 2009, pages 1987-1990. ACM, 2009. doi:10.1145/1645953.1646283

% Conference paper in the CIKM 2009 proceedings. Acronyms and place names are
% brace-protected so sentence-casing styles keep their capitals, and numeric
% ranges use "--" so they typeset as en-dashes.
@inproceedings{AgarwalKLCGGHRS09,
  title = {{URL} normalization for de-duplication of web pages},
  author = {Amit Agarwal and Hema Swetha Koppula and Krishna P. Leela and Krishna Prasad Chitrapura and Sachin Garg and Pavan Kumar GM and Chittaranjan Haty and Anirban Roy and Amit Sasturkar},
  year = {2009},
  doi = {10.1145/1645953.1646283},
  url = {http://doi.acm.org/10.1145/1645953.1646283},
  researchr = {https://researchr.org/publication/AgarwalKLCGGHRS09},
  cites = {0},
  citedby = {0},
  pages = {1987--1990},
  booktitle = {Proceedings of the 18th {ACM} Conference on Information and Knowledge Management, {CIKM} 2009, {Hong Kong}, {China}, November 2--6, 2009},
  editor = {David Wai-Lok Cheung and Il-Yeol Song and Wesley W. Chu and Xiaohua Hu and Jimmy J. Lin},
  publisher = {ACM},
  isbn = {978-1-60558-512-3},
}