@@ -2,64 +2,25 @@ namespace VSharp.Explorer
2
2
3
3
open System.Collections .Generic
4
4
open Microsoft.ML .OnnxRuntime
5
+ open System.IO
6
+ open System
7
+ open System.Net
8
+ open System.Net .Sockets
9
+ open System.Text
5
10
open System.Text .Json
6
11
open VSharp
7
12
open VSharp.IL .Serializer
8
13
open VSharp.ML .GameServer .Messages
9
- open System.IO
10
14
11
15
type AIMode =
12
16
| Runner
13
17
| TrainingSendModel
14
18
| TrainingSendEachStep
15
19
16
- type internal AISearcher ( oracle : Oracle , aiAgentTrainingMode : Option < AIAgentTrainingMode >) =
17
- let stepsToSwitchToAI =
18
- match aiAgentTrainingMode with
19
- | None -> 0 u< step>
20
- | Some ( SendModel options) -> options.aiAgentTrainingOptions.stepsToSwitchToAI
21
- | Some ( SendEachStep options) -> options.aiAgentTrainingOptions.stepsToSwitchToAI
22
-
23
- let stepsToPlay =
24
- match aiAgentTrainingMode with
25
- | None -> 0 u< step>
26
- | Some ( SendModel options) -> options.aiAgentTrainingOptions.stepsToPlay
27
- | Some ( SendEachStep options) -> options.aiAgentTrainingOptions.stepsToPlay
28
-
29
- let mutable lastCollectedStatistics =
30
- Statistics ()
31
- let mutable defaultSearcherSteps = 0 u< step>
32
- let mutable ( gameState : Option < GameState >) =
33
- None
34
- let mutable useDefaultSearcher =
35
- stepsToSwitchToAI > 0 u< step>
36
- let mutable afterFirstAIPeek = false
37
- let mutable incorrectPredictedStateId =
38
- false
39
-
40
- let defaultSearcher =
41
- let pickSearcher =
42
- function
43
- | BFSMode -> BFSSearcher () :> IForwardSearcher
44
- | DFSMode -> DFSSearcher () :> IForwardSearcher
45
- | x -> failwithf $" Unexpected default searcher {x}. DFS and BFS supported for now."
46
-
47
- match aiAgentTrainingMode with
48
- | None -> BFSSearcher () :> IForwardSearcher
49
- | Some ( SendModel options) -> pickSearcher options.aiAgentTrainingOptions.aiBaseOptions.defaultSearchStrategy
50
- | Some ( SendEachStep options) -> pickSearcher options.aiAgentTrainingOptions.aiBaseOptions.defaultSearchStrategy
51
-
52
- let mutable stepsPlayed = 0 u< step>
53
-
54
- let isInAIMode () =
55
- ( not useDefaultSearcher) && afterFirstAIPeek
56
-
57
- let q = ResizeArray<_> ()
58
- let availableStates = HashSet<_> ()
59
-
60
- let updateGameState ( delta : GameState ) =
20
+ module GameUtils =
21
+ let updateGameState ( delta : GameState ) ( gameState : Option < GameState >) =
61
22
match gameState with
62
- | None -> gameState <- Some delta
23
+ | None -> Some delta
63
24
| Some s ->
64
25
let updatedBasicBlocks =
65
26
delta.GraphVertices |> Array.map ( fun b -> b.Id) |> HashSet
@@ -106,7 +67,52 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
106
67
)
107
68
)
108
69
109
- gameState <- Some <| GameState ( vertices.ToArray (), states, edges.ToArray ())
70
+ Some <| GameState ( vertices.ToArray (), states, edges.ToArray ())
71
+ type internal AISearcher ( oracle : Oracle , aiAgentTrainingMode : Option < AIAgentTrainingMode >) =
72
+ let stepsToSwitchToAI =
73
+ match aiAgentTrainingMode with
74
+ | None -> 0 u< step>
75
+ | Some ( SendModel options) -> options.aiAgentTrainingOptions.stepsToSwitchToAI
76
+ | Some ( SendEachStep options) -> options.aiAgentTrainingOptions.stepsToSwitchToAI
77
+
78
+ let stepsToPlay =
79
+ match aiAgentTrainingMode with
80
+ | None -> 0 u< step>
81
+ | Some ( SendModel options) -> options.aiAgentTrainingOptions.stepsToPlay
82
+ | Some ( SendEachStep options) -> options.aiAgentTrainingOptions.stepsToPlay
83
+
84
+ let mutable lastCollectedStatistics =
85
+ Statistics ()
86
+ let mutable defaultSearcherSteps = 0 u< step>
87
+ let mutable ( gameState : Option < GameState >) =
88
+ None
89
+ let mutable useDefaultSearcher =
90
+ stepsToSwitchToAI > 0 u< step>
91
+ let mutable afterFirstAIPeek = false
92
+ let mutable incorrectPredictedStateId =
93
+ false
94
+
95
+ let defaultSearcher =
96
+ let pickSearcher =
97
+ function
98
+ | BFSMode -> BFSSearcher () :> IForwardSearcher
99
+ | DFSMode -> DFSSearcher () :> IForwardSearcher
100
+ | x -> failwithf $" Unexpected default searcher {x}. DFS and BFS supported for now."
101
+
102
+ match aiAgentTrainingMode with
103
+ | None -> BFSSearcher () :> IForwardSearcher
104
+ | Some ( SendModel options) -> pickSearcher options.aiAgentTrainingOptions.aiBaseOptions.defaultSearchStrategy
105
+ | Some ( SendEachStep options) -> pickSearcher options.aiAgentTrainingOptions.aiBaseOptions.defaultSearchStrategy
106
+
107
+ let mutable stepsPlayed = 0 u< step>
108
+
109
+ let isInAIMode () =
110
+ ( not useDefaultSearcher) && afterFirstAIPeek
111
+
112
+ let q = ResizeArray<_> ()
113
+ let availableStates = HashSet<_> ()
114
+
115
+
110
116
111
117
let init states =
112
118
q.AddRange states
@@ -153,7 +159,7 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
153
159
if Seq.length availableStates > 0 then
154
160
let gameStateDelta =
155
161
collectGameStateDelta ()
156
- updateGameState gameStateDelta
162
+ gameState <- GameUtils. updateGameState gameStateDelta gameState
157
163
let statistics =
158
164
computeStatistics gameState.Value
159
165
Application.applicationGraphDelta.Clear ()
@@ -168,7 +174,7 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
168
174
else
169
175
let gameStateDelta =
170
176
collectGameStateDelta ()
171
- updateGameState gameStateDelta
177
+ gameState <- GameUtils. updateGameState gameStateDelta gameState
172
178
let statistics =
173
179
computeStatistics gameState.Value
174
180
@@ -184,12 +190,12 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
184
190
else
185
191
let toPredict =
186
192
match aiMode with
187
- | TrainingSendEachStep ->
193
+ | TrainingSendEachStep
194
+ | TrainingSendModel ->
188
195
if stepsPlayed > 0 u< step> then
189
196
gameStateDelta
190
197
else
191
198
gameState.Value
192
- | TrainingSendModel
193
199
| Runner -> gameState.Value
194
200
195
201
let stateId = oracle.Predict toPredict
@@ -225,15 +231,37 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
225
231
let arrayOutputJson =
226
232
JsonSerializer.Serialize arrayOutput
227
233
arrayOutputJson
228
-
229
- let writeStep ( gameState : GameState ) ( output : IDisposableReadOnlyCollection < OrtValue >) ( filePath : string ) =
234
+ let stepToString ( gameState : GameState ) ( output : IDisposableReadOnlyCollection < OrtValue >) =
230
235
let gameStateJson =
231
236
JsonSerializer.Serialize gameState
232
- let stateJson = serializeOutput output
233
- File.WriteAllText ( filePath + " _gameState" , gameStateJson)
234
- File.WriteAllText ( filePath + " _nn_output" , stateJson)
237
+ let outputJson = serializeOutput output
238
+ let DELIM = Environment.NewLine
239
+ let strToSaveAsList =
240
+ [
241
+ gameStateJson
242
+ DELIM
243
+ outputJson
244
+ DELIM
245
+ ]
246
+ String.concat " " strToSaveAsList
235
247
236
248
let createOracleRunner ( pathToONNX : string , aiAgentTrainingModelOptions : Option < AIAgentTrainingModelOptions >) =
249
+ let host = " localhost"
250
+ let port =
251
+ match aiAgentTrainingModelOptions with
252
+ | Some options -> options.port
253
+ | None -> 0
254
+
255
+ let client = new TcpClient ()
256
+ client.Connect ( host, port)
257
+ client.SendBufferSize <- 2048
258
+ let stream = client.GetStream ()
259
+
260
+ let saveStep ( gameState : GameState ) ( output : IDisposableReadOnlyCollection < OrtValue >) =
261
+ let bytes =
262
+ Encoding.UTF8.GetBytes ( stepToString gameState output)
263
+ stream.Write ( bytes, 0 , bytes.Length)
264
+ stream.Flush ()
237
265
238
266
let sessionOptions =
239
267
if useGPU then
@@ -254,8 +282,15 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
254
282
let feedback ( x : Feedback ) = ()
255
283
256
284
let mutable stepsPlayed = 0
285
+ let mutable currentGameState = None
257
286
258
- let predict ( gameState : GameState ) =
287
+ let predict ( gameStateOrDelta : GameState ) =
288
+ let _ =
289
+ match aiAgentTrainingModelOptions with
290
+ | Some _ when not ( stepsPlayed = 0 ) ->
291
+ currentGameState <- GameUtils.updateGameState gameStateOrDelta currentGameState
292
+ | _ -> currentGameState <- Some gameStateOrDelta
293
+ let gameState = currentGameState.Value
259
294
let stateIds =
260
295
Dictionary< uint< stateId>, int> ()
261
296
let verticesIds =
@@ -441,7 +476,7 @@ type internal AISearcher(oracle: Oracle, aiAgentTrainingMode: Option<AIAgentTrai
441
476
442
477
let _ =
443
478
match aiAgentTrainingModelOptions with
444
- | Some options -> writeStep gameState output ( options.outputDirectory + ( $ " /{stepsPlayed} " ))
479
+ | Some _ -> saveStep gameStateOrDelta output
445
480
| None -> ()
446
481
447
482
stepsPlayed <- stepsPlayed + 1
0 commit comments