Skip to content

Commit

Permalink
aliviando el area de trabajo
Browse files Browse the repository at this point in the history
  • Loading branch information
JuanVentrone committed Jun 17, 2020
1 parent dcb19e9 commit d72e8a2
Show file tree
Hide file tree
Showing 6 changed files with 221 additions and 15 deletions.
4 changes: 4 additions & 0 deletions Main.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,3 +4,7 @@
from Python import Scrapper_Blockchain_Func as sf
from Python import procces_table as pt


sf.scrapper_update()

pt.concat_lost_block()
6 changes: 3 additions & 3 deletions Python/Scrapper_Blockchain_Func.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,14 +71,14 @@ def block_scrapper_pages(n_pages_1,n_range_block):
try:
url_pages=requests.get(url_pages)
if url_pages.status_code==200:
print("entro a la URL")
print("BLoques buscados: ",n_range_block)
# Scrapping the mean Page --- Escrapeo la pagina principal

sopa=BeautifulSoup(url_pages.text, "html5lib")

links=sopa.find_all("a",attrs={"class":"sc-1r996ns-0 gzrtQD sc-1tbyx6t-1 kXxRxe iklhnl-0 boNhIO"})
links_blocks=[link.get("href") for link in links]
print(len(links))




Expand Down Expand Up @@ -200,7 +200,7 @@ def scrapper_update():
# Scrapper Innit

df,dr= block_scrapper_pages(n_pages,n_range_block)
if dr==[]:table_save_update(df,data_old)
if dr==[]:df_suma=table_save_update(df,data_old)
else:
df_new=last_scrpapping(df,dr,n_range_block)
df_suma=table_save_update(df_new,data_old)
Expand Down
Binary file modified Python/__pycache__/Scrapper_Blockchain_Func.cpython-37.pyc
Binary file not shown.
Binary file modified Python/__pycache__/procces_table.cpython-37.pyc
Binary file not shown.
196 changes: 192 additions & 4 deletions Python/data_table.ipynb

Large diffs are not rendered by default.

30 changes: 22 additions & 8 deletions Python/procces_table.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,19 +6,21 @@




def n_block():
    """Return the ``"n_blocks_total"`` entry of the blockchain statistics.

    The statistics mapping comes from ``sf.blockchain_stats()``; ``None`` is
    returned when that mapping has no ``"n_blocks_total"`` key.
    """
    stats = sf.blockchain_stats()
    return stats.get("n_blocks_total")

def rango_b(a, b, i, block_f, lista_height):
    """Collect the gaps found while walking ``lista_height`` from index ``i``.

    Starting with the expected height ``a`` at position ``i``, the walk
    advances while each stored height equals the expected one.  Whenever the
    stored height differs, the pair ``[expected, found]`` is appended to
    ``block_f`` and the walk resumes from the found height.  The walk stops
    once the expected height equals ``b``.

    Args:
        a: Height expected at position ``i``.
        b: Height at which the search ends.
        i: Index in ``lista_height`` where the walk starts.
        block_f: List mutated in place; receives one ``[expected, found]``
            pair per gap.
        lista_height: Indexable sequence of heights.
            NOTE(review): presumably sorted ascending and containing ``b`` --
            confirm against the caller.

    Returns:
        None (the result of the final ``print`` call).
    """
    # Implemented as a loop instead of self-recursion: one stack frame per
    # gap would raise RecursionError on inputs with many gaps.
    while True:
        while a == lista_height[i]:
            if a == b:
                return print("Finalizo la Busqueda de Bloques no escrapeados")
            a += 1
            i += 1
        # The stored height is not the expected one: record the gap.
        block_f.append([a, lista_height[i]])

        # Resume the walk from the height that was actually found.
        a = lista_height[i]
        print(a)


def process(block_f):
Expand All @@ -27,8 +29,8 @@ def process(block_f):
total=n_block()
for i in block_f:

a=math.ceil((total-i[0])/50+2)
b=math.ceil((total-i[1])/50-1)
a=math.ceil(((total-i[0])/50)+2)
b=math.ceil(((total-i[1])/50)-1)
page_url_list.append({"Ini Page":b,"Final Page":a,"I block":i[0],"F block":i[1]})

return page_url_list
Expand All @@ -41,7 +43,6 @@ def find_lost_block():
a=min(lista_height)
b=max(lista_height)
block_f=[]
c=0
i=0
rango_b(a,b,i,block_f,lista_height)

Expand All @@ -50,7 +51,6 @@ def find_lost_block():
df_error_pages.to_csv("blockchain data/bc data/rang_lost_blocks.csv")

# si deseas activar un escrappeo inmediato

# r=str(input("El Proceso se realizo exitosamente!,¿Desea Scrappear los Bloques Faltantes,?,Presione cualquier tecla"))
# if r!="":sf.scrapper_lost_block()

Expand All @@ -73,7 +73,10 @@ def uni_table(direc):
return data

def read_data():
    """Load the first raw-data partition and drop leftover index columns.

    Reads ``blockchain data/bc data/old data/data_crudo_1.csv`` (relative to
    the current working directory), prints that path, and removes every
    column whose name contains ``unnamed`` (case-insensitive).

    Returns:
        The loaded ``pandas.DataFrame`` without the ``unnamed`` columns.
    """
    direc = "blockchain data/bc data/old data/data_crudo_1.csv"
    print(direc)
    # Single read of the partition file; the earlier read of data_crudo.csv
    # was discarded immediately and only added a needless file dependency.
    data = pd.read_csv(direc)

    unnamed_columns = data.columns[data.columns.str.contains('unnamed', case=False)]
    data.drop(unnamed_columns, axis=1, inplace=True)
    return data

Expand Down Expand Up @@ -119,6 +122,17 @@ def partition_lost_bock():
data_temp=data[i[0]:i[1]]
data_temp.to_csv("blockchain data/bc data/lost range data/lost_blocks"+str(i[0])+"_"+str(i[1])+".csv")

def partition_data_crudo():
    """Split the raw data CSV into two halves stored as separate files.

    Reads ``blockchain data/bc data/old data/data_crudo.csv`` and writes, in
    the same folder:

    * ``data_crudo_1.csv`` -- the rows from the midpoint to the end;
    * ``data_crudo_2.csv`` -- the rows before the midpoint.

    With an odd number of rows the extra row goes to ``data_crudo_1.csv``.
    Both files are written with the DataFrame index as their first column.
    """
    data = pd.read_csv("blockchain data/bc data/old data/data_crudo.csv")
    middle = len(data) // 2
    # Note the naming: file 1 holds the second half, file 2 the first half.
    second_half = data[middle:]
    first_half = data[:middle]
    second_half.to_csv("blockchain data/bc data/old data/data_crudo_1.csv")
    first_half.to_csv("blockchain data/bc data/old data/data_crudo_2.csv")





# Codigo Creado por Juan Vicente Ventrone
Expand Down

0 comments on commit d72e8a2

Please sign in to comment.