Fixed a problem in model-training and renamed files
This commit is contained in:
parent
30cc846c6f
commit
5f0f9f1dce
78
discriminate.py
Normal file
78
discriminate.py
Normal file
@ -0,0 +1,78 @@
|
|||||||
|
import os
|
||||||
|
|
||||||
|
import torch
|
||||||
|
from torch import nn
|
||||||
|
from torch import nn, optim
|
||||||
|
from torch.utils.data import DataLoader
|
||||||
|
import numpy as np
|
||||||
|
import random
|
||||||
|
|
||||||
|
import shark
|
||||||
|
|
||||||
|
bs = int(256/8)
|
||||||
|
|
||||||
|
class Model(nn.Module):
|
||||||
|
def __init__(self):
|
||||||
|
super(Model, self).__init__()
|
||||||
|
self.lstm = nn.LSTM(
|
||||||
|
input_size=8,
|
||||||
|
hidden_size=16,
|
||||||
|
num_layers=3,
|
||||||
|
dropout=0.1,
|
||||||
|
)
|
||||||
|
self.fc = nn.Linear(16, 1)
|
||||||
|
self.out = nn.Sigmoid()
|
||||||
|
|
||||||
|
def forward(self, x, prev_state):
|
||||||
|
output, state = self.lstm(x, prev_state)
|
||||||
|
logits = self.fc(output)
|
||||||
|
val = self.out(logits)
|
||||||
|
#print(str(logits.item())+" > "+str(val.item()))
|
||||||
|
return val, state
|
||||||
|
|
||||||
|
def init_state(self, sequence_length):
|
||||||
|
return (torch.zeros(3, 1, 16),
|
||||||
|
torch.zeros(3, 1, 16))
|
||||||
|
|
||||||
|
def run(model, seq):
|
||||||
|
state_h, state_c = model.init_state(len(seq))
|
||||||
|
for i in range(len(seq)):
|
||||||
|
x = torch.tensor([[[float(d) for d in bin(seq[i])[2:].zfill(8)]]], dtype=torch.float32)
|
||||||
|
y_pred, (state_h, state_c) = model(x, (state_h, state_c))
|
||||||
|
|
||||||
|
#state_h = state_h.detach()
|
||||||
|
#state_c = state_c.detach()
|
||||||
|
|
||||||
|
return y_pred.item()
|
||||||
|
|
||||||
|
def score(model, ciphertext, hypothesis):
|
||||||
|
seq = shark.xor(ciphertext, hypothesis)
|
||||||
|
return run(model, seq)
|
||||||
|
|
||||||
|
def test_scoring(model):
|
||||||
|
length = 16
|
||||||
|
iv = shark.genIV()
|
||||||
|
|
||||||
|
# TODO: Generate human language
|
||||||
|
plaintext = os.urandom(length*bs)
|
||||||
|
plaintextAlt = os.urandom(length*bs)
|
||||||
|
|
||||||
|
plaintextSemi = [plaintext[s] if random.random()>0.5 else plaintextAlt[s] for s in range(length)]
|
||||||
|
|
||||||
|
ciphertext = shark.enc(plaintext, b'VerySecureKeyMustKeepSecretDontTellAnyone', iv)
|
||||||
|
|
||||||
|
high = score(model, ciphertext, plaintext)
|
||||||
|
low = score(model, ciphertext, plaintextAlt)
|
||||||
|
mid = score(model, ciphertext, plaintextSemi)
|
||||||
|
|
||||||
|
print({'h': high, 'l': low, 'm': mid})
|
||||||
|
|
||||||
|
def load():
|
||||||
|
model = Model()
|
||||||
|
model.load_state_dict(torch.load('wh_discriminator.n'))
|
||||||
|
model.eval()
|
||||||
|
return model
|
||||||
|
|
||||||
|
if __name__=="__main__":
|
||||||
|
m = load()
|
||||||
|
test_scoring(m)
|
7
shark.py
7
shark.py
@ -14,14 +14,17 @@ bs = int(256/8)
|
|||||||
def xor(ta,tb):
|
def xor(ta,tb):
|
||||||
return bytes(a ^ b for a, b in zip(ta, tb))
|
return bytes(a ^ b for a, b in zip(ta, tb))
|
||||||
|
|
||||||
|
def genIV():
|
||||||
|
return random.randint(0, 2**(bs-1)).to_bytes(bs, byteorder='big')
|
||||||
|
|
||||||
def enc(plaintext, key, iv):
|
def enc(plaintext, key, iv):
|
||||||
ciphertext = bytes()
|
ciphertext = bytes()
|
||||||
for i in range(math.ceil(len(plaintext)/bs)):
|
for i in range(math.ceil(len(plaintext)/bs)):
|
||||||
m = hashlib.sha256()
|
m = hashlib.sha256()
|
||||||
m.update(xor(key, iv + i.to_bytes(bs, byteorder='big')))
|
m.update(xor(key, iv + i.to_bytes(bs, byteorder='big')))
|
||||||
k = m.digest()
|
k = m.digest()
|
||||||
ciphertext += xor(k, plaintext[bs*i:][:bs].ljust(bs, b'0'))
|
|
||||||
iv = (int.from_bytes(iv, byteorder='big')+1).to_bytes(bs, byteorder='big')
|
iv = (int.from_bytes(iv, byteorder='big')+1).to_bytes(bs, byteorder='big')
|
||||||
|
ciphertext += xor(k, plaintext[bs*i:][:bs].ljust(bs, b'0'))
|
||||||
return ciphertext
|
return ciphertext
|
||||||
|
|
||||||
def dec(ciphertext, key, iv):
|
def dec(ciphertext, key, iv):
|
||||||
@ -34,6 +37,6 @@ def getSample(length, src=None, key=b'VerySecureKeyMustKeepSecretDontTellAnyone'
|
|||||||
r = os.urandom(length*bs)
|
r = os.urandom(length*bs)
|
||||||
return (r, 0)
|
return (r, 0)
|
||||||
else:
|
else:
|
||||||
iv = random.randint(0, 2**(bs-1)).to_bytes(bs, byteorder='big')
|
iv = genIV()
|
||||||
b = bytes(length*bs)
|
b = bytes(length*bs)
|
||||||
return (enc(b, key, iv), 1)
|
return (enc(b, key, iv), 1)
|
||||||
|
@ -40,26 +40,34 @@ def train(model, seq_len=16*64):
|
|||||||
criterion = nn.BCELoss()
|
criterion = nn.BCELoss()
|
||||||
optimizer = optim.Adam(model.parameters(), lr=0.0001)
|
optimizer = optim.Adam(model.parameters(), lr=0.0001)
|
||||||
|
|
||||||
|
state_h = [None,None]
|
||||||
|
state_c = [None,None]
|
||||||
|
blob = [None,None]
|
||||||
|
correct = [None,None]
|
||||||
|
|
||||||
for epoch in range(1024):
|
for epoch in range(1024):
|
||||||
state_h, state_c = model.init_state(seq_len)
|
state_h[0], state_c[0] = model.init_state(seq_len)
|
||||||
|
state_h[1], state_c[1] = model.init_state(seq_len)
|
||||||
|
|
||||||
blob, y = shark.getSample(min(seq_len, 16*(epoch+1)), epoch%2)
|
blob[0], _ = shark.getSample(min(seq_len, 16*(epoch+1)), 0)
|
||||||
|
blob[1], _ = shark.getSample(min(seq_len, 16*(epoch+1)), 1)
|
||||||
optimizer.zero_grad()
|
optimizer.zero_grad()
|
||||||
for i in range(len(blob)):
|
for i in range(len(blob[0])):
|
||||||
x = torch.tensor([[[float(d) for d in bin(blob[i])[2:].zfill(8)]]], dtype=torch.float32)
|
for t in range(2):
|
||||||
y_pred, (state_h, state_c) = model(x, (state_h, state_c))
|
x = torch.tensor([[[float(d) for d in bin(blob[t][i])[2:].zfill(8)]]], dtype=torch.float32)
|
||||||
loss = criterion(y_pred[0][0][0], torch.tensor(y, dtype=torch.float32))
|
y_pred, (state_h[t], state_c[t]) = model(x, (state_h[t], state_c[t]))
|
||||||
|
loss = criterion(y_pred[0][0][0], torch.tensor(t, dtype=torch.float32))
|
||||||
|
|
||||||
state_h = state_h.detach()
|
state_h[t] = state_h[t].detach()
|
||||||
state_c = state_c.detach()
|
state_c[t] = state_c[t].detach()
|
||||||
|
|
||||||
loss.backward()
|
loss.backward()
|
||||||
optimizer.step()
|
optimizer.step()
|
||||||
|
|
||||||
correct = round(y_pred.item()) == y
|
correct[t] = round(y_pred.item()) == t
|
||||||
ltLoss = ltLoss*0.9 + 0.1*loss.item()
|
ltLoss = ltLoss*0.9 + 0.1*loss.item()
|
||||||
lltLoss = lltLoss*0.9 + 0.1*ltLoss
|
lltLoss = lltLoss*0.9 + 0.1*ltLoss
|
||||||
print({ 'epoch': epoch, 'loss': loss.item(), 'ltLoss': ltLoss, 'correct?': correct })
|
print({ 'epoch': epoch, 'loss': loss.item(), 'ltLoss': ltLoss, 'ok0': correct[0], 'ok1': correct[1], 'succ': correct[0] and correct[1] })
|
||||||
if epoch % 8 == 0:
|
if epoch % 8 == 0:
|
||||||
torch.save(model.state_dict(), 'model_savepoints/'+tid+'_'+str(epoch)+'.n')
|
torch.save(model.state_dict(), 'model_savepoints/'+tid+'_'+str(epoch)+'.n')
|
||||||
|
|
Loading…
Reference in New Issue
Block a user