This repository has been archived by the owner on May 23, 2019. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 18
/
simpleEngineApiExample.py
121 lines (93 loc) · 4.47 KB
/
simpleEngineApiExample.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
#!/usr/bin/env python
############################################################################
# #
# Copyright 2014 Prelert Ltd #
# #
# Licensed under the Apache License, Version 2.0 (the "License"); #
# you may not use this file except in compliance with the License. #
# You may obtain a copy of the License at #
# #
# http://www.apache.org/licenses/LICENSE-2.0 #
# #
# Unless required by applicable law or agreed to in writing, software #
# distributed under the License is distributed on an "AS IS" BASIS, #
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. #
# See the License for the specific language governing permissions and #
# limitations under the License. #
# #
############################################################################
'''
Creates a new job and uploads farequote.csv to it. The job is
then closed and the result buckets are queried.
The example file used can be downloaded from
http://s3.amazonaws.com/prelert_demo/farequote.csv and looks like this:
time,airline,responsetime,sourcetype
2014-06-23 00:00:00Z,AAL,132.2046,farequote
2014-06-23 00:00:00Z,JZA,990.4628,farequote
2014-06-23 00:00:00Z,JBU,877.5927,farequote
The script is invoked with one positional argument, the path to the
farequote.csv file, and has optional arguments to specify the location
of the Engine API. Run the script with '--help' to see the options.
The output is a CSV printout of date, anomaly score and maximum normalized probability.
If a bucket timestamp is specified only the anomaly records for that bucket
are returned.
'''
import argparse
import sys
import json
import logging
from prelert.engineApiClient import EngineApiClient
# Prelert Engine API connection params
# HOST and PORT are the defaults for the --host and --port command line options.
HOST = 'localhost'
PORT = 8080
# Passed to EngineApiClient together with the host and port.
BASE_URL = 'engine/v2'
def setupLogging():
    '''
    Configure the root logger at INFO level so that each message is
    written to the console as "<time> <level name> <message>".
    '''
    line_layout = '%(asctime)s %(levelname)s %(message)s'
    logging.basicConfig(format=line_layout, level=logging.INFO)
def parseArguments():
    '''
    Parse the command line.

    Options:
        --host  The Engine API host name (defaults to HOST)
        --port  The Engine API port as an integer (defaults to PORT)
        file    Positional argument, the path to farequote.csv

    Returns the argparse namespace with the attributes 'host', 'port'
    and 'file'.
    '''
    parser = argparse.ArgumentParser()
    parser.add_argument("--host", help="The Prelert Engine API host, defaults to "
        + HOST, default=HOST)
    # type=int keeps args.port an int whether it comes from the command
    # line or from the default, and rejects non-numeric ports up front
    parser.add_argument("--port", type=int, help="The Prelert Engine API port, defaults to "
        + str(PORT), default=PORT)
    parser.add_argument("file", help="Path to farequote.csv")

    return parser.parse_args()
def _reportFailure(http_status_code, response):
    '''
    Print the HTTP status code and the JSON encoded response of a failed
    Engine API call.
    '''
    # A single tuple argument gives the same output whether print is a
    # statement (Python 2) or a function (Python 3)
    print((http_status_code, json.dumps(response)))


def main():
    '''
    Create a job, upload the data file given on the command line to it,
    close the job and print its result buckets as CSV.

    Each API call returns a (http_status_code, response) pair. If the
    status code is not the one expected for that step (201 for create,
    202 for upload and close, 200 for the bucket query) the status and
    response are printed and the function returns without doing any
    further work.
    '''
    setupLogging()
    args = parseArguments()

    # Create the REST API client
    engine_client = EngineApiClient(args.host, BASE_URL, args.port)

    job_config = (
        '{"analysisConfig" : {'
        '"bucketSpan":3600,'
        '"detectors" :[{"function":"metric","fieldName":"responsetime","byFieldName":"airline"}] },'
        '"dataDescription" : {"fieldDelimiter":",", "timeField":"time", "timeFormat":"yyyy-MM-dd HH:mm:ssX"} }'
    )

    logging.info("Creating job")
    (http_status_code, response) = engine_client.createJob(job_config)
    if http_status_code != 201:
        _reportFailure(http_status_code, response)
        return

    job_id = response['id']

    logging.info("Uploading data to %s", job_id)
    # The with block closes the data file even if the upload raises
    with open(args.file, 'rb') as data_file:
        (http_status_code, response) = engine_client.upload(job_id, data_file)
    if http_status_code != 202:
        _reportFailure(http_status_code, response)
        return

    logging.info("Closing job %s", job_id)
    (http_status_code, response) = engine_client.close(job_id)
    if http_status_code != 202:
        _reportFailure(http_status_code, response)
        return

    logging.info("Get result buckets for job %s", job_id)
    (http_status_code, response) = engine_client.getAllBuckets(job_id)
    if http_status_code != 200:
        _reportFailure(http_status_code, response)
        return

    # Single-argument print(...) calls run unchanged on Python 2 and 3
    print("Date,Anomaly Score,Max Normalized Probablility")
    for bucket in response:
        print("{0},{1},{2}".format(bucket['timestamp'], bucket['anomalyScore'],
                                   bucket['maxNormalizedProbability']))
# Run the example only when this file is executed as a script.
if __name__ == "__main__":
    sys.exit(main())