-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathagent_random.py
89 lines (62 loc) · 2.27 KB
/
agent_random.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
import evaluation_pb2
import evaluation_pb2_grpc
import grpc
import os
import pickle
import time
import numpy as np
# Pause for 30 seconds before opening the channel.
# NOTE(review): presumably this gives the environment service time to start
# listening -- confirm against the deployment setup.
time.sleep(30)

# Any non-empty LOCAL_EVALUATION value selects the "environment" host;
# otherwise the agent connects to localhost. The port is 8086 in both cases.
LOCAL_EVALUATION = os.environ.get("LOCAL_EVALUATION")
channel = grpc.insecure_channel(
    "environment:8086" if LOCAL_EVALUATION else "localhost:8086"
)
def pack_for_grpc(entity) -> bytes:
    """Serialize *entity* with pickle so it can be sent in a gRPC message.

    Args:
        entity: Any picklable Python object (``None`` is allowed).

    Returns:
        The pickled byte string for *entity*.

    Raises:
        pickle.PicklingError: If *entity* cannot be pickled.
    """
    return pickle.dumps(entity)
def unpack_for_grpc(entity: bytes):
    """Deserialize a pickled payload received in a gRPC message.

    Args:
        entity: Byte string produced by ``pickle.dumps``.

    Returns:
        The Python object reconstructed from *entity*.

    Raises:
        pickle.UnpicklingError: If *entity* is not a valid pickle stream.
    """
    # SECURITY: pickle.loads can execute arbitrary code embedded in the
    # payload. Only use this with a trusted peer; do not point the agent at
    # an endpoint you do not control.
    return pickle.loads(entity)
def _query_env(rpc, payload=None):
    """Call *rpc* with *payload* pickled into a Package and unpickle the reply."""
    request = evaluation_pb2.Package(SerializedEntity=pack_for_grpc(payload))
    return unpack_for_grpc(rpc(request).SerializedEntity)


str_test = 'August 1, 11:00AM'  # <-- to be removed, only for testing

stub = evaluation_pb2_grpc.EnvironmentStub(channel)

# Show the output keys as reported before any change, and the length of the
# observation returned by a reset with those keys.
print(_query_env(stub.get_output_keys))
print(f'Len OBS: {len(_query_env(stub.reset))}')
print("Original Ouput Obs keys:" + str(_query_env(stub.get_output_keys)))

# Ask the environment to report only 'hand_pos'; the reply is discarded.
keys = ['hand_pos']
_query_env(stub.set_output_keys, keys)

# Read the keys back first, then reset, matching the original call order.
reduced_keys = _query_env(stub.get_output_keys)
reduced_obs = _query_env(stub.reset)
print(
    "Reduced Set of Ouput Obs keys: " + str(reduced_keys)
    + " Len:" + str(len(reduced_obs))
)
# Send random actions to the environment until it returns a truthy stop flag.
flag = None
counter = 0

# flag starts falsy, so the loop below always runs at least once; the initial
# reset can therefore happen up front instead of behind a counter == 0 check.
print('BB ('+str_test+'): Start Resetting the environment and get 1st obs')
reset_request = evaluation_pb2.Package(SerializedEntity=pack_for_grpc(None))
obs = unpack_for_grpc(stub.reset(reset_request).SerializedEntity)

while not flag:
    # 39 uniform samples in [0, 1).
    # NOTE(review): 39 is presumably the environment's action dimension -- confirm.
    action = np.random.rand(39)

    # Send the action and decode the environment's reply.
    act_request = evaluation_pb2.Package(SerializedEntity=pack_for_grpc(action))
    reply = stub.act_on_environment(act_request)
    feedback = unpack_for_grpc(reply.SerializedEntity)["feedback"]

    # Element 0 is kept as the new observation; element 2 is the stop flag
    # that ends the loop (reported as "solved" in the message below).
    obs = feedback[0]
    flag = feedback[2]

    print(f"BAODING ({str_test}): Agent Feedback iter {counter} -- solved: {flag}")
    print("*" * 100)
    counter += 1