InferringIntention/keyboard_and_mouse/sampler_user.py
2024-03-24 23:42:27 +01:00

68 lines
2 KiB
Python

import numpy as np
from numpy import genfromtxt
import csv
import pandas
import argparse
def sample_predciton(path, rate):
data = pandas.read_csv(path).values
task_list = [0, 1, 2, 3, 4, 5, 6]
start = 0
stop = 0
num_unique = np.unique(data[:,1])
samples = []
for j in task_list:
for i in num_unique:
inx = np.where((data[:,1] == i) & (data[:,-2] == j))
samples.append(data[inx])
for i in range(len(samples)):
n = int(len(samples[i])*(100-rate)/100)
if n == 0:
n = 1
samples[i] = samples[i][:-n]
if len(samples[i]) == 0:
print('len of after sampling',len(samples[i]))
return np.vstack(samples)
def main():
# parsing parameters
parser = argparse.ArgumentParser(description='')
parser.add_argument('--batch_size', type=int, default=8, help='batch size')
parser.add_argument('--lr', type=float, default=1e-4, help='learning rate')
parser.add_argument('--hidden_size', type=int, default=128, help='hidden_size')
parser.add_argument('--model_type', type=str, default='lstmlast', help='model type')
args = parser.parse_args()
task = np.arange(7)
user_num = 5
bs = args.batch_size
lr = args.lr # 1e-4
hs = args.hidden_size #128
model_type = args.model_type #'lstmlast'
rate = [10, 20, 30, 40, 50, 60, 70, 80, 90]
for i in task:
for j in rate:
for l in range(user_num):
pred_path = "prediction/task" + str(i) + "/" + model_type + "_bs_" + str(bs) + "_lr_" + str(lr) + "_hidden_size_" + str(hs) + "/user" + str(l) + "_pred.csv"
save_path = "prediction/task" + str(i) + "/" + model_type + "_bs_" + str(bs) + "_lr_" + str(lr) + "_hidden_size_" + str(hs) + "/user" + str(l) + "_rate_" + str(j) + "_pred.csv"
data = sample_predciton(pred_path, j)
head = []
for r in range(7):
head.append('act'+str(r+1))
head.append('task_name')
head.append('gt')
head.insert(0,'action_id')
pandas.DataFrame(data[:,1:]).to_csv(save_path, header=head)
if __name__ == '__main__':
# split the prediction by length, from 10% to 90%
main()