This commit is contained in:
Jon Ander 2024-11-30 18:48:03 +01:00
parent 6768381bd0
commit 8d9092af03
5 changed files with 9 additions and 6 deletions

View File

@ -2,7 +2,7 @@
<module type="PYTHON_MODULE" version="4">
<component name="NewModuleRootManager">
<content url="file://$MODULE_DIR$" />
<orderEntry type="jdk" jdkName="Python 3.13" jdkType="Python SDK" />
<orderEntry type="jdk" jdkName="Python 3.11" jdkType="Python SDK" />
<orderEntry type="sourceFolder" forTests="false" />
</component>
</module>

View File

@ -3,5 +3,5 @@
<component name="Black">
<option name="sdkName" value="Python 3.13" />
</component>
<component name="ProjectRootManager" version="2" project-jdk-name="Python 3.13" project-jdk-type="Python SDK" />
<component name="ProjectRootManager" version="2" project-jdk-name="Python 3.11" project-jdk-type="Python SDK" />
</project>

0
ejercicios/__init__.py Normal file
View File

View File

@ -0,0 +1,3 @@
from ejercicios.paralelismo02.ej01.ej01 import MiScraping
# Build the scraper thread object with an empty URL; it is only constructed
# here, nothing in this script starts it.
hilo = MiScraping("")

View File

@ -4,16 +4,16 @@ from bs4 import BeautifulSoup
import re
class MiScraping(threading.Thread):
def __init__(self,url):
threading.Thread.__init__(self)
self.url = url
self.links =[]
def run(self):
# self.url coge el "url" que se le pase al constructor a la hora de llamar al metodo
response = requests.get(self.url)
soup = BeautifulSoup(response.text,"html.parser")
self.links = [a['href'] for a in soup.find_all('a', href=True) if re.match(r'http[s]?://', a['href'])]
def get_links(self):
return self.links