Browse Source

Better statistics and alphanumerical tokens

Loweel 4 years ago
parent
commit
bef4972180
3 changed files with 11 additions and 22 deletions
  1. 1 1
      .gitignore
  2. 9 20
      bayes.json
  3. 1 1
      classifier.go

+ 1 - 1
.gitignore

@@ -1,4 +1,4 @@
 zardoz 
-bayes.txt
+bayes.*
 /logs
 logs/*

+ 9 - 20
bayes.json

@@ -1,28 +1,16 @@
 STATS: {
  "BLOCKLEARN": 3,
- "LEARN-BAD": 9,
- "MEH": 3,
- "PASSLEARN": 3,
+ "GENERATION": 2,
+ "LEARN-BAD": 12,
+ "MEH": 10,
+ "PASSLEARN": 2,
  "YOUNG": 15
 }
  WORKING: {
- "/favicon.ico": "GOOD",
- "accept": "MEH",
- "agent": "MEH",
- "cors": "GOOD",
- "curl": "MEH",
- "favicon": "GOOD",
- "google": "GOOD",
- "guns": "GOOD",
- "host": "MEH",
- "http": "MEH",
- "localhost": "BAD",
- "penis": "BAD",
- "qualcosa": "BAD",
- "user": "MEH",
- "wallet": "BAD"
-}
- LEARNING: {
+ "22170": "BAD",
+ "28765": "BAD",
+ "3672": "BAD",
+ "8089": "BAD",
  "accept": "MEH",
  "agent": "MEH",
  "curl": "MEH",
@@ -33,3 +21,4 @@ STATS: {
  "qualcosa": "BAD",
  "user": "MEH"
 }
+ LEARNING: {}

+ 1 - 1
classifier.go

@@ -69,7 +69,7 @@ func blockAndlearn(resp *http.Response) error {
 
 func sanitizeHeaders(s string) string {
 
-	re := regexp.MustCompile(`[a-zA-Z]{4,32}|([0-9]{1,3}\.[0-9]{1,3}\.[0-9]{1,3}\.[0-9]{1,3})|([0-9a-fA-F]{8}\-[0-9a-fA-F]{4}\-[0-9a-fA-F]{4}\-[0-9a-fA-F]{4}\-[0-9a-fA-F]{12})`)
+	re := regexp.MustCompile(`[[:alnum:]]{4,32}|([0-9]{1,3}\.[0-9]{1,3}\.[0-9]{1,3}\.[0-9]{1,3})|([0-9a-fA-F]{8}\-[0-9a-fA-F]{4}\-[0-9a-fA-F]{4}\-[0-9a-fA-F]{4}\-[0-9a-fA-F]{12})`)
 	matched := re.FindAllString(s, -1)
 
 	uMatched := Unique(matched)