If you roll the dice 60,000 times, it will be close to 10,000 each. Let's apply this to Lotto 6 and increase the probability of hitting Lotto 6 a little.
from bs4 import BeautifulSoup
import requests
from urllib.request import urlopen
import re
import pandas as pd
import numpy as np
def oldurl():
ulist=[]
for a in range(60001,60442,20):
url='https://www.mizuhobank.co.jp/retail/takarakuji/loto/backnumber/loto' + str(a) +'.html'
ulist.append(url)
return ulist
def setdb_first():
ulist=oldurl()
lolist=[]
for url in ulist:
r = requests.get(url)
r.encoding = r.apparent_encoding
soup = BeautifulSoup(r.text, "html.parser")
table=soup.findAll("table", {"class":"typeTK"})
if len(table):
table =table[0]
table=str(table)
pdtable=pd.read_html(table) #to pandas
for i in pdtable[0].itertuples():
i=list(i)
i=i[1:]
i[0]=int(re.findall('\d+', i[0])[0]) #get
datelist=re.findall('\d+', i[1])
datelist[1]=str(datelist[1]).zfill(2)
datelist[2]=str(datelist[2]).zfill(2)
i[1]=int(''.join(datelist))
lolist.append(i)
#print(i)
else:
print('set db: failed ')
print('no data:')
return False
lonp=np.array(lolist)
np.save('oldlo', lonp)
def setdb_second(start):
newlo=[]
cnt=0
while True:
cnt+=1
times=str(start+cnt).zfill(4)
r = requests.get('https://www.mizuhobank.co.jp/retail/takarakuji/loto/loto6/csv/A102'+times+'.CSV')
r.encoding = r.apparent_encoding
soup = BeautifulSoup(r.text, "html.parser")
regex=re.compile("(\d+)[,](\d+)[,](\d+)[,](\d+)[,](\d+)[,](\d+)[,]\w+[,](\d+)")
lolist=[(start+cnt)]
soup=str(soup)
result=regex.search(soup)
if result:
for a in range(1,8,1):
lolist.append(result.group(a))
newlo.append(lolist)
else:
break
if (cnt%10)==0:
print('complete: ',start+cnt)
lonp=np.array(newlo)
np.save('newlo', lonp)
print(lonp)
def update():
before=np.load('newlo.npy',allow_pickle=True)
start=before.shape[0]+460 #460>old times
newlo=[]
cnt=0
while True:
cnt+=1
times=str(start+cnt).zfill(4)
r = requests.get('https://www.mizuhobank.co.jp/retail/takarakuji/loto/loto6/csv/A102'+times+'.CSV')
r.encoding = r.apparent_encoding
soup = BeautifulSoup(r.text, "html.parser")
regex=re.compile("(\d+)[,](\d+)[,](\d+)[,](\d+)[,](\d+)[,](\d+)[,]\w+[,](\d+)")
lolist=[(start+cnt)]
soup=str(soup)
result=regex.search(soup)
if result:
print("updated! :",times,"th")
for a in range(1,8,1):
lolist.append(result.group(a))
newlo.append(lolist)
else:
break
if (cnt%10)==0:
print('complete: ',start+cnt)
if cnt==1:
print("Nothing to update")
else:
lonp=np.array(newlo)
sumlo=np.concatenate((before,lonp), axis=0)
np.save('newlo', sumlo)
def freq(loset,times): #frequently to times
lo=loset[:times,1:7]
unique, counts=np.unique(lo,return_counts=True)
counts=np.asarray(counts)
unique=np.asarray(unique)
unique.resize(1,counts.shape[0])
i=np.argsort(counts)[::-1]
c=unique[:,i]
print("total of lotto6: ",times)
tmp=0
frq=c[0,:]
nums=np.sort(counts)[::-1]
for a in range(43):
check='no.'+str(a+1)+ ' > '+str(frq[a])+':'+str(nums[a])+' times'
print(check)
return c[0,:]
def freqs(li):
li=np.array(li)
unique, counts=np.unique(li,return_counts=True)
counts=np.asarray(counts)
unique=np.asarray(unique)
unique.resize(1,counts.shape[0])
i=np.argsort(counts)[::-1]
c=unique[:,i]
def scen(loset,times,stand): #frequently from times,0-42>1-43
checkset=loset[times:,:]#1000>1001-
cnt=0
yn=[0,0,0]
scontlist=[]
mcountlist=[]
for a in checkset:
sdata=freq(loset,times+cnt)
cont=0
min=42
for b in a[1:7]:
#print(b)
loc = np.where(sdata == b)
if loc[1][0]<min:
min=loc[1][0]
if loc[1][0]>stand:
cont+=1
scontlist.append(cont)
mcountlist.append(min)
if min>stand:
yn[0]+=1
else:
yn[1]+=1
cnt+=1
freqs(mcountlist)
return yn
def select(li,pick):
selnum=[]
cnt=0
while True:
ran=np.random.randint(0,li.size,1)
try:
selnum.index(ran[0])
except:
selnum.append(ran[0])
cnt+=1
if cnt==pick:
break
cnt=0
for a in selnum:
selnum[cnt]=li[selnum[cnt]]
cnt+=1
return selnum
def choose(flist,ign,topn,topc):
flist=flist[ign:]
result=select(flist[:topn],topc)
print("list: ",flist[:topn].shape[0],flist[:topn],result)
return result
def dupli(li,pick):
li=li[:,1:7]
#print(li[3])
i=np.argsort(pick)
pick=pick[i]
#pick=np.array([16,18,26,27,34,40])
result=np.where((li == pick).all(axis=1))
if result[0].size!=0:
print("Wow! it was", result[0],"th")
print("Try again!!")
return False
return True
def checksave(sumlo,li):
regex=re.compile("(\d+)\D+(\d+)\D+(\d+)\D+(\d+)\D+(\d+)\D+(\d+)\D+(\d+)")
futurehope="\n"+str(sumlo[-1,0]+1) + str(li)
with open('past.txt', 'r+') as f:
d = f.readlines()
f.seek(0)
for i in d:
#print(i)
if len(i)<2:
print('')
elif (i.find('hit') == -1):
result=regex.search(i)
cnt=0
hope=[]
besix=[]
for a in range(1,8,1):
hope.append(int(result.group(a)))
#print("test:",hope)
## completely check
if sumlo[-1,0]<hope[0]:
f.write(i)
break
if sumlo[hope[0]-1,0]!=hope[0]:
print("not times matech")
print(tt)
##
for a in range(6):
hit=np.where(sumlo[hope[0]-1,1:]==hope[a])
if hit[0].size!=0:
cnt+=1
besix.append(hope[a])
output=str(hope[0])+'/ '+ str(cnt) +'hit /'+str(hope[1:7])+'/'+str(sumlo[hope[0]-1,1:7])+'/'+str(besix)
#print(output)
print("Bless you: ",output)
f.write('%s\n' %output)
#f.write('%s\n' %output)
else:
f.write(i)
f.write(futurehope)
#if (string.find(CentoOS') != -1):
#setdb_first()
#setdb_second(460)
try:
oldlo=np.load('oldlo.npy',allow_pickle=True)
except:
setdb_first()
setdb_second(460)
oldlo=np.load('oldlo.npy',allow_pickle=True)
oldlo=np.delete(oldlo,1,1)
update()
newlo=np.load('newlo.npy',allow_pickle=True)
sumlo=np.concatenate((oldlo,newlo), axis=0)
sumlo=sumlo.astype('int16')
total=sumlo.shape[0]
#print("Total: ", total)
pri=freq(sumlo,total)# 1~3
#######for simulation
start_times=1000
#print(sumlo.shape)
#print(sumlo[0:4])
#######for simulation
ruckynum=5 #0 to 10
first=choose(pri,2,10+ruckynum,2) # no.3~17, in15 pick 2
second=choose(pri,12+ruckynum,28,4) # no.18~43, in26 pick 4
pick=np.hstack([first,second])
i=np.argsort(pick)
pick=pick[i]
if dupli(sumlo,pick):
checksave(sumlo,pick)
print('good luck: ',pick)
Recommended Posts