forked from tommyrot/superseriousstats
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathparser_mirc6.php
126 lines (112 loc) · 5.78 KB
/
parser_mirc6.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
<?php
/**
* Copyright (c) 2009-2015, Jos de Ruijter <jos@dutnie.nl>
*/
/**
* Parse instructions for the mIRC6 logfile format.
*
* Line Format Notes
* ---------------------------------------------------------------------------------------------------------------------
* Normal <NICK> MSG Skip empty lines.
* Action ** NICK MSG "mIRC6hack" syntax. Skip empty actions.
* Slap ** NICK slaps MSG "mIRC6hack" syntax. Slaps may lack a (valid)
* target.
* Nickchange * NICK is now known as NICK
* Join * NICK (HOST) has joined CHAN
* Part * NICK (HOST) has left CHAN (MSG) Part message may be absent, or empty due to
* normalization.
* Quit * NICK (HOST) Quit (MSG) Quit message may be absent, or empty due to
* normalization.
* Mode * NICK sets mode: +o-v NICK NICK Only check for combinations of ops (+o) and
* voices (+v).
* Topic * NICK changes topic to 'MSG' Skip empty topics.
* Kick * NICK was kicked by NICK (MSG) Kick message may be empty due to normalization.
* ---------------------------------------------------------------------------------------------------------------------
*
* Notes:
* - normalize_line() scrubs all lines before passing them on to parse_line().
* - The way mIRC logs actions is ambiguous: nearly all other line types can be spoofed with an action, and even
* non-chat messages are logged with the same syntax. For this reason we don't parse regular actions. There is a small
* workaround script available, however, referred to as "mIRC6hack"; see the howto for details.
* - Given our handling of "action" lines (and lack thereof) the order of the regular expressions below is irrelevant
* (current order aims for best performance).
* - The most common channel prefixes are "#&!+" and the most common nick prefixes are "~&@%+!*". If one of the nick
* prefixes slips through then validate_nick() will fail.
* - In certain cases $matches[] won't contain index items if these optionally appear at the end of a line. We use
* empty() to check whether an index item is both set and has a value.
*/
class parser_mirc6 extends parser
{
    /**
     * Parse a line for various chat data.
     *
     * The line is tested against each known line format in turn. The first format that matches decides which
     * set_*() method receives the captured data. Non-empty lines that match none of the formats are reported with a
     * debug message and otherwise ignored.
     *
     * @param string $line A single line from the logfile.
     */
    protected function parse_line($line)
    {
        /**
         * "Normal" lines.
         */
        if (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] <[~&@%+!*]?(?<nick>\S+)> (?<line>.+)$/', $line, $matches)) {
            $this->set_normal($matches['time'], $matches['nick'], $matches['line']);

        /**
         * "Join" lines.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<nick>\S+) \(\S+\) has joined [#&!+]\S+$/', $line, $matches)) {
            $this->set_join($matches['time'], $matches['nick']);

        /**
         * "Quit" lines.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<nick>\S+) \(\S+\) Quit( \(.*\))?$/', $line, $matches)) {
            $this->set_quit($matches['time'], $matches['nick']);

        /**
         * "Mode" lines. Each "o" or "v" flag is paired, in order, with the next nick in the list and carries the most
         * recently seen sign.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<nick_performing>\S+) sets mode: (?<modes>[-+][ov]+([-+][ov]+)?) (?<nicks_undergoing>\S+( \S+)*)$/', $line, $matches)) {
            $modenum = 0;
            $nicks_undergoing = explode(' ', $matches['nicks_undergoing']);

            foreach (str_split($matches['modes']) as $mode) {
                /**
                 * The regular expression guarantees the mode string starts with a sign, so $modesign is always set
                 * before the first flag is handled.
                 */
                if ($mode === '-' || $mode === '+') {
                    $modesign = $mode;
                    continue;
                }

                /**
                 * The regular expression does not tie the number of flags to the number of nicks, and these lines can
                 * be spoofed, so there may be fewer nicks than flags. Stop here rather than read past the end of the
                 * nick list and pass a missing nick on to set_mode().
                 */
                if (!isset($nicks_undergoing[$modenum])) {
                    output::output('debug', __METHOD__.'(): skipping remaining modes on line '.$this->linenum.': \''.$line.'\'');
                    break;
                }

                $this->set_mode($matches['time'], $matches['nick_performing'], $nicks_undergoing[$modenum], $modesign.$mode);
                $modenum++;
            }

        /**
         * "Action" and "slap" lines. A slap is recorded as a slap and also as an action.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \*\* [~&@%+!*]?(?<line>(?<nick_performing>\S+) ((?<slap>[sS][lL][aA][pP][sS]( (?<nick_undergoing>\S+)( .+)?)?)|(.+)))$/', $line, $matches)) {
            if (!empty($matches['slap'])) {
                /**
                 * The slap target is optional; pass null when none was captured.
                 */
                $this->set_slap($matches['time'], $matches['nick_performing'], (!empty($matches['nick_undergoing']) ? $matches['nick_undergoing'] : null));
            }

            $this->set_action($matches['time'], $matches['nick_performing'], $matches['line']);

        /**
         * "Nickchange" lines.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<nick_performing>\S+) is now known as (?<nick_undergoing>\S+)$/', $line, $matches)) {
            $this->set_nickchange($matches['time'], $matches['nick_performing'], $matches['nick_undergoing']);

        /**
         * "Part" lines.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<nick>\S+) \(\S+\) has left [#&!+]\S+( \(.*\))?$/', $line, $matches)) {
            $this->set_part($matches['time'], $matches['nick']);

        /**
         * "Topic" lines. A topic that is exactly one space is skipped; presumably that is how an empty topic is
         * logged (to be confirmed against real logs).
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<nick>\S+) changes topic to \'(?<line>.+)\'$/', $line, $matches)) {
            if ($matches['line'] !== ' ') {
                $this->set_topic($matches['time'], $matches['nick'], $matches['line']);
            }

        /**
         * "Kick" lines.
         */
        } elseif (preg_match('/^\[(?<time>\d{2}:\d{2}(:\d{2})?)\] \* (?<line>(?<nick_undergoing>\S+) was kicked by (?<nick_performing>\S+) \(.*\))$/', $line, $matches)) {
            $this->set_kick($matches['time'], $matches['nick_performing'], $matches['nick_undergoing'], $matches['line']);

        /**
         * Skip everything else.
         */
        } elseif ($line !== '') {
            output::output('debug', __METHOD__.'(): skipping line '.$this->linenum.': \''.$line.'\'');
        }
    }
}