def html_hash(html_string: str) -> int:
    """Return a simple 32-bit polynomial hash of an HTML document string.

    For development purposes only. Not cryptographically secure.

    The hash is a rolling polynomial: for every character the running value
    is multiplied by 31, the character's code point is added, and the result
    is reduced modulo 2**32.

    Args:
        html_string: The document text to hash. Every character contributes,
            including whitespace and newlines.

    Returns:
        An integer in the range [0, 2**32). The empty string hashes to 0.
    """
    hash_value = 0
    for char in html_string:
        # Reduce on every step so the running value never exceeds 32 bits.
        hash_value = (hash_value * 31 + ord(char)) % (2**32)
    return hash_value
  10. if __name__ == '__main__':
  11. html_doc1 = """
  12. <!DOCTYPE html>
  13. <html>
  14. <head>
  15. <title>Example 1</title>
  16. </head>
  17. <body>
  18. <h1>Hello, world!</h1>
  19. </body>
  20. </html>
  21. """
  22. html_doc2 = """
  23. <!DOCTYPE html>
  24. <html>
  25. <head>
  26. <title>Example 2</title>
  27. </head>
  28. <body>
  29. <h1>Hello, world!</h1>
  30. </body>
  31. </html>
  32. """
  33. html_doc3 = """
  34. <!DOCTYPE html>
  35. <html>
  36. <head>
  37. <title>Example 3</title>
  38. </head>
  39. <body>
  40. <h2>Another heading</h2>
  41. </body>
  42. </html>
  43. """
  44. hash1 = html_hash(html_doc1)
  45. hash2 = html_hash(html_doc2)
  46. hash3 = html_hash(html_doc3)
  47. print(f"Hash of doc1: {hash1}")
  48. print(f"Hash of doc2: {hash2}")
  49. print(f"Hash of doc3: {hash3}")
  50. #Test case for empty string
  51. html_doc4 = ""
  52. hash4 = html_hash(html_doc4)
  53. print(f"Hash of doc4: {hash4}")

Add your comment