Compare commits

...

2 Commits

Author SHA1 Message Date
jon ander fad7ec7aa8 wip 2024-12-02 16:53:37 +01:00
Jon Ander 819bab2e5c wip 2024-12-02 13:58:51 +01:00
4 changed files with 8 additions and 4 deletions

View File

@@ -2,7 +2,7 @@
<module type="PYTHON_MODULE" version="4"> <module type="PYTHON_MODULE" version="4">
<component name="NewModuleRootManager"> <component name="NewModuleRootManager">
<content url="file://$MODULE_DIR$" /> <content url="file://$MODULE_DIR$" />
<orderEntry type="jdk" jdkName="Python 3.11" jdkType="Python SDK" /> <orderEntry type="inheritedJdk" />
<orderEntry type="sourceFolder" forTests="false" /> <orderEntry type="sourceFolder" forTests="false" />
</component> </component>
</module> </module>

View File

@@ -3,5 +3,5 @@
<component name="Black"> <component name="Black">
<option name="sdkName" value="Python 3.13" /> <option name="sdkName" value="Python 3.13" />
</component> </component>
<component name="ProjectRootManager" version="2" project-jdk-name="Python 3.11" project-jdk-type="Python SDK" /> <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.13" project-jdk-type="Python SDK" />
</project> </project>

View File

@@ -1,3 +1,7 @@
from ejercicios.paralelismo02.ej01.ej01 import MiScraping from ejercicios.paralelismo02.ej01.ej01 import MiScraping
hilo = MiScraping("") hilo = MiScraping("http://localhost:8000/portada.html")
hilo.start()
hilo.join()
links = hilo.get_links()
print(links)

View File

@@ -11,7 +11,7 @@ class MiScraping(threading.Thread):
def run(self): def run(self):
response = requests.get(self.url) response = requests.get(self.url)
soup = BeautifulSoup(response.text,"html.parser") soup = BeautifulSoup(response.text,"html.parser")
self.links = [a['href'] for a in soup.find_all('a', href=True) if re.match(r'http[s]?://', a['href'])] self.links = [a['href'] for a in soup.find_all('a', href=True)]
def get_links(self): def get_links(self):
return self.links return self.links