From db7e8378cc99ec779789d747501280af3ebc7776 Mon Sep 17 00:00:00 2001
From: Sebastian Colombo <colombosebas@gmail.com>
Date: Tue, 2 May 2023 18:54:53 -0300
Subject: [PATCH] Reto #18 python

---
 .../python/colombosebas.py"                   | 40 +++++++++++++++++++
 1 file changed, 40 insertions(+)
 create mode 100644 "Retos/Reto #18 - WEB SCRAPING [Dif\303\255cil]/python/colombosebas.py"

diff --git "a/Retos/Reto #18 - WEB SCRAPING [Dif\303\255cil]/python/colombosebas.py" "b/Retos/Reto #18 - WEB SCRAPING [Dif\303\255cil]/python/colombosebas.py"
new file mode 100644
index 0000000000..c18c23d6b0
--- /dev/null
+++ "b/Retos/Reto #18 - WEB SCRAPING [Dif\303\255cil]/python/colombosebas.py"	
@@ -0,0 +1,40 @@
+import requests
+from bs4 import BeautifulSoup
+import xml.etree.ElementTree as ET
+
+# Scrapes https://holamundo.day and prints the "Agenda 8 de mayo" schedule: the HTML is
+# fetched with requests, normalised by BeautifulSoup and walked with ElementTree, gluing
+# text spans into one line per entry. Any change to the page markup may break this.
+
+url = 'https://holamundo.day'
+response = requests.get(url, timeout=10)  # bounded wait instead of hanging forever
+response.raise_for_status()  # fail loudly rather than parsing an error page
+soup = BeautifulSoup(response.content, 'html.parser')
+html_str = soup.prettify()
+root = ET.fromstring(html_str)  # raises ET.ParseError if the markup is not well-formed XML
+agenda8 = False  # becomes True once the agenda heading span has been seen
+cadena = ""  # agenda entry currently being assembled
+
+for elem in root.iter():
+    if elem.tag != 'span':  # only <span> elements are ever inspected
+        continue
+    texto = elem.text or ""  # elem.text may be None; str(None) would inject "None"
+    if not agenda8:
+        if "Agenda 8 de mayo" in texto:
+            agenda8 = True
+            print("Agenda 8 de Mayo")
+        continue
+    # Test the current element's own attributes, not a value left over from the heading.
+    if "data-slate-string" not in elem.attrib:
+        continue
+    texto2 = texto.replace(" ", "").strip()  # NOTE(review): drops every space; NBSP meant?
+    if texto2.startswith(("1", "2")):  # presumably an hour (1x:xx / 2x:xx) opening an entry
+        if cadena:  # nothing to flush before the first entry
+            print(cadena)
+        cadena = texto2
+    elif texto2:  # continuation text; a lone '|' separator gets a leading space
+        cadena += (" " + texto2) if texto2 == '|' else texto2
+    if "Despedida" in texto2:  # stop once the entry mentioning "Despedida" is reached
+        break
+if cadena:  # flush the final entry, which is still pending when the loop ends
+    print(cadena)