parse_flow.pl 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343
  1. #!/usr/bin/perl
  2. #
  3. # Copyright (C) Roman Dmitiriev, rnd@rajven.ru
  4. #
  5. use English;
  6. use base;
  7. use FindBin '$Bin';
  8. use lib "$Bin/";
  9. use strict;
  10. use DBI;
  11. use Time::Local;
  12. use Net::Patricia;
  13. use Data::Dumper;
  14. use Date::Parse;
  15. use Socket;
  16. use Rstat::config;
  17. use Rstat::main;
  18. use Rstat::net_utils;
  19. use Rstat::mysql;
  20. use Parallel::ForkManager;
  # Run at nice level 19 so the import does not compete with other processes.
  setpriority(0,0,19);

  # The router id is the first command-line argument. With more than one
  # argument it is shifted off @ARGV; a single argument is left in place.
  my $router_id;
  if (scalar @ARGV>1) { $router_id=shift(@ARGV); } else { $router_id=$ARGV[0]; }
  if (!$router_id) {
      db_log_error($dbh,"Router id not defined! Bye...");
      exit 110;
  }
  # The id is interpolated unquoted into SQL statements and printed with %d
  # further down, so anything but a plain integer is rejected here.
  if ($router_id !~ /\A\d+\z/) {
      db_log_error($dbh,"Router id must be numeric! Bye...");
      exit 110;
  }

  # Upper bound for the number of concurrently running worker processes.
  my $fork_count = $cpu_count*10;

  # Logged below as the "timestep" in seconds and used later as the divisor
  # for the per-second rates.
  # NOTE(review): presumably option 55 is the export interval in minutes - confirm.
  my $timeshift = get_option($dbh,55)*60;

  db_log_debug($dbh,"Import traffic from router id: $router_id start. Timestep $timeshift sec.") if ($debug);

  # Global counters, filled from the results returned by the workers.
  # "illegal" is what the workers count and what the final report prints, so
  # it is initialised together with the other counters.
  my %stats = (
      pkt  => { all => 0, user_in => 0, user_out => 0, free => 0, unknown => 0, illegal => 0 },
      line => { all => 0, user => 0, free => 0, unknown => 0, illegal => 0 },
  );

  # net objects: lookup tree mapping a user address to its User_auth id
  my $users = Net::Patricia->new;

  InitSubnets();

  # get userid list: one traffic accumulator per active (not deleted) auth record
  my @auth_list_ref = get_records_sql($dbh,"SELECT id,ip,user_id,save_traf FROM User_auth where deleted=0 ORDER by user_id");

  my %user_stats;
  foreach my $row (@auth_list_ref) {
      my $ip = $row->{ip};
      $users->add_string($ip,$row->{id});
      $user_stats{$ip} = {
          net       => $ip,
          auth_id   => $row->{id},
          user_id   => $row->{user_id},
          save_traf => $row->{save_traf},
          in        => 0,
          out       => 0,
          pkt_in    => 0,
          pkt_out   => 0,
      };
  }
  # Fallback flow time as epoch seconds; replaced by the timestamp of the
  # input once lines are read. It is later passed to localtime(), so it has to
  # be a number and not the formatted string that scalar localtime() returns.
  my $start_time = time();
  my $hour_date;
  my $minute_date;
  my @batch_sql_traf=();

  my $pm = Parallel::ForkManager->new($fork_count);

  # Runs in the parent each time a worker has been reaped. $data is a
  # reference to the scalar the worker handed to finish(); that scalar holds
  # the hash built by calc_stats().
  $pm->run_on_finish(
      sub {
          my ($pid, $exit, $ident, $signal, $core, $data) = @_;

          if (!$data) {
              # A worker without a result means a whole batch of lines is missing
              # from the totals - say so instead of dropping it silently.
              warn "parse_flow: worker $pid returned no data (exit=$exit, signal=$signal)\n";
              return;
          }
          my $dataref = ${$data};

          # per-address traffic
          my $worker_stats = $dataref->{stats} || {};
          foreach my $user_ip (keys %{$worker_stats}) {
              my $delta = $worker_stats->{$user_ip};
              my $total = ($user_stats{$user_ip} ||= {});
              foreach my $field (qw(in pkt_in out pkt_out)) {
                  $total->{$field} += $delta->{$field} || 0;
              }
          }

          # global counters; "illegal" is the class the workers actually fill
          # and the one printed by the final report
          foreach my $class (qw(all user_in user_out free unknown illegal)) {
              $stats{pkt}{$class} += $dataref->{pkt}{$class} || 0;
          }
          foreach my $class (qw(all user free unknown illegal)) {
              $stats{line}{$class} += $dataref->{line}{$class} || 0;
          }

          # Detailed traffic rows prepared by the worker. The list is absent when
          # the worker had nothing to save, so check before dereferencing.
          my $sql_list = $dataref->{sql};
          if (ref($sql_list) eq 'ARRAY' and scalar(@{$sql_list})) {
              # NOTE(review): a new connection is opened for every finished worker and
              # the previous handle is not disconnected; presumably the handle shared
              # with the exited child is no longer usable - confirm init_db().
              $dbh=init_db();
              # run the batch as one transaction; switching AutoCommit back on
              # commits it (see DBI documentation)
              $dbh->{AutoCommit} = 0;
              foreach my $sSQL (@{$sql_list}) {
                  my $sth = $dbh->prepare($sSQL);
                  $sth->execute;
                  $sth->finish;
              }
              $dbh->{AutoCommit} = 1;
          }
      }
  );
  # Read flow records from STDIN and hand them to worker processes in batches.
  my @input_buf=();
  my $line_count = 0;
  my $first_step = 0;
  # number of lines processed by one worker
  my $batch_size = 5000;

  while (my $line = <STDIN>) {
      chomp($line);
      # fields are separated by ';' - strip every whitespace character
      $line=~s/\s+//g;

      # The first record that carries a time field defines the timestamp of the
      # whole import. Lines without a time are rejected by calc_stats(), so
      # they must not define the timestamp either.
      if (!$first_step) {
          my ($l_time) = split(/;/,$line);
          if ($l_time) {
              $start_time = $l_time;
              $first_step = 1;
          }
      }

      push(@input_buf,$line);
      $line_count++;
      if ($line_count < $batch_size) { next; }

      # batch is full: detach it from the read buffer and process it in a child
      $line_count = 0;
      my @tmp = @input_buf;
      @input_buf = ();

      # start() returns the child pid in the parent and 0 in the child
      $pm->start and next;
      my $ret = calc_stats(\@tmp);
      $pm->finish(0, \$ret);
  }

  # Remaining lines (less than a full batch). Only the child may do the work:
  # without the check on start() the parent would run calc_stats() on the same
  # lines too and throw the result away.
  if (scalar(@input_buf)) {
      if (!$pm->start) {
          my $ret = calc_stats(\@input_buf);
          $pm->finish(0, \$ret);
      }
  }

  $pm->wait_all_children;
  undef(@input_buf);
  # calc_stats(\@lines)
  #
  # Classifies a batch of flow records and returns a hash reference:
  #   pkt   => packet counters  (all, user_in, user_out, free, unknown, illegal)
  #   line  => record counters  (all, user, free, unknown, illegal)
  #   stats => { address => { ip, in, out, pkt_in, pkt_out [, auth_id => 0] } }
  #   sql   => [ INSERT statements for Traffic_detail ]
  #
  # Every record is a ';' separated string:
  #   time;proto;src_ip;dst_ip;src_port;dst_port;packets;bytes;in_dev;out_dev
  #
  # Classification of a record:
  #   illegal - incomplete record, 0.0.0.0 / 255.255.255.255, special networks,
  #             no endpoint in the office networks, or an unknown address while
  #             $config_ref{add_unknown_user} is off
  #   free    - office <-> office and office <-> free networks
  #   user    - everything else; bytes and packets are added exactly once to the
  #             office-side address
  sub calc_stats {
      my $lines = shift;

      my $lines_stats = {
          pkt   => { all => 0, user_in => 0, user_out => 0, free => 0, unknown => 0, illegal => 0 },
          line  => { all => 0, user => 0, free => 0, unknown => 0, illegal => 0 },
          stats => {},
          sql   => [],
      };

      # count one record and its packets in the given class (illegal/free)
      my $count_as = sub {
          my ($class, $packets) = @_;
          $lines_stats->{line}{$class}++;
          $lines_stats->{pkt}{$class} += $packets || 0;
      };

      foreach my $line (@$lines) {
          my ($l_time,$l_proto,$l_src_ip,$l_dst_ip,$l_src_port,$l_dst_port,$l_packets,$l_bytes,$l_in_dev,$l_out_dev) = split(/;/,$line);

          $lines_stats->{pkt}{all} += $l_packets || 0;
          $lines_stats->{line}{all}++;

          # incomplete record: nothing to look up
          if (!$l_time or !$l_src_ip or !$l_dst_ip) { $count_as->('illegal',$l_packets); next; }

          if ($l_src_ip eq '0.0.0.0' or $l_dst_ip eq '0.0.0.0') { $count_as->('illegal',$l_packets); next; }
          if ($l_src_ip eq '255.255.255.255' or $l_dst_ip eq '255.255.255.255') { $count_as->('illegal',$l_packets); next; }

          #special networks
          if ($Special_Nets->match_string($l_src_ip) or $Special_Nets->match_string($l_dst_ip)) { $count_as->('illegal',$l_packets); next; }

          my $src_is_office = $office_networks->match_string($l_src_ip);
          my $dst_is_office = $office_networks->match_string($l_dst_ip);

          #unknown networks
          if (!$src_is_office and !$dst_is_office) { $count_as->('illegal',$l_packets); next; }

          #local forward
          if ($src_is_office and $dst_is_office) { $count_as->('free',$l_packets); next; }

          #free forward
          if ($src_is_office and $free_networks->match_string($l_dst_ip)) { $count_as->('free',$l_packets); next; }
          if ($dst_is_office and $free_networks->match_string($l_src_ip)) { $count_as->('free',$l_packets); next; }

          # Exactly one endpoint is inside the office networks at this point;
          # that endpoint is the user the traffic is accounted to.
          my $outbound = $src_is_office ? 1 : 0;
          my $user_ip  = $outbound ? $l_src_ip : $l_dst_ip;

          # Resolve the auth record regardless of the detail setting, so that the
          # accounting below does not depend on whether details are saved.
          my $auth_id = $users->match_string($user_ip) || 0;

          #save full packet
          if ($save_detail) {
              # NOTE(review): the previous code tested "!$auth_id" before the id was
              # looked up, so this condition is what was effectively evaluated. If
              # details are meant to be limited to users with save_traf (plus unknown
              # addresses), add "!$auth_id and" in front of $config_ref{save_detail}.
              my $user_wants_detail = (exists $user_stats{$user_ip} and $user_stats{$user_ip}{save_traf});
              if ($user_wants_detail or $config_ref{save_detail}) {
                  my $l_src_ip_aton=StrToIp($l_src_ip);
                  my $l_dst_ip_aton=StrToIp($l_dst_ip);
                  my ($sec,$min,$hour,$day,$month,$year) = (localtime($l_time))[0,1,2,3,4,5];
                  my $full_time = $dbh->quote(sprintf "%04d-%02d-%02d %02d:%02d:%02d",$year+1900,$month+1,$day,$hour,$min,$sec);
                  # values taken from the input are quoted by the driver instead of
                  # being wrapped in '...' by hand
                  my ($q_proto,$q_src_port,$q_dst_port,$q_bytes,$q_packets) =
                      map { $dbh->quote(defined $_ ? $_ : '') } ($l_proto,$l_src_port,$l_dst_port,$l_bytes,$l_packets);
                  push(@{$lines_stats->{sql}},"INSERT INTO Traffic_detail (auth_id,router_id,timestamp,proto,src_ip,dst_ip,src_port,dst_port,bytes,pkt) VALUES($auth_id,$router_id,$full_time,$q_proto,$l_src_ip_aton,$l_dst_ip_aton,$q_src_port,$q_dst_port,$q_bytes,$q_packets)");
              }
          }

          # unknown address and automatic creation is switched off
          if (!$auth_id and !$config_ref{add_unknown_user}) { $count_as->('illegal',$l_packets); next; }

          # account the record once, in the direction seen from the user
          my $entry = ($lines_stats->{stats}{$user_ip} ||= { in => 0, out => 0, pkt_in => 0, pkt_out => 0 });
          $entry->{ip} = $user_ip;
          # mark addresses that have no auth record yet
          if (!$auth_id) { $entry->{auth_id} = 0; }

          if ($outbound) {
              $entry->{out}     += $l_bytes || 0;
              $entry->{pkt_out} += $l_packets || 0;
              $lines_stats->{pkt}{user_out} += $l_packets || 0;
          }
          else {
              $entry->{in}     += $l_bytes || 0;
              $entry->{pkt_in} += $l_packets || 0;
              $lines_stats->{pkt}{user_in} += $l_packets || 0;
          }
          $lines_stats->{line}{user}++;
      }

      return $lines_stats;
  }
  # All workers are done: write the accumulated per-user traffic to the
  # database, recalculate quotas and log a summary.
  $dbh=init_db();

  ####################################################################################################

  # $start_time has to be epoch seconds; fall back to "now" if the input did
  # not provide a usable value.
  if (!defined $start_time or $start_time !~ /\A\d+(?:\.\d+)?\z/) { $start_time = time(); }

  my ($min,$hour,$day,$month,$year) = (localtime($start_time))[1,2,3,4,5];
  #start hour
  my $hour_date1 = $dbh->quote(sprintf "%04d-%02d-%02d %02d:00:00",$year+1900,$month+1,$day,$hour);
  #end hour (last second of the same hour)
  my $hour_date2 = $dbh->quote(sprintf "%04d-%02d-%02d %02d:59:59",$year+1900,$month+1,$day,$hour);
  #flow time
  my $flow_date = $dbh->quote(sprintf "%04d-%02d-%02d %02d:%02d:00",$year+1900,$month+1,$day,$hour,$min);

  # update database
  foreach my $user_ip (keys %user_stats) {
      my $entry = $user_stats{$user_ip};
      my $user_ip_aton=StrToIp($user_ip);

      if (!$entry->{auth_id}) {
          # address without an auth record: create one
          my $auth_id=new_auth($dbh,$user_ip);
          $entry->{auth_id}=$auth_id;
          #fix traffic detail for new users
          # ($hour_date1/$hour_date2 already carry their quotes from $dbh->quote)
          push(@batch_sql_traf,"UPDATE Traffic_detail set auth_id=$auth_id WHERE auth_id=0 AND `timestamp`>=$hour_date1 AND `timestamp`<=$hour_date2 AND (src_ip=$user_ip_aton OR dst_ip=$user_ip_aton)");
      }

      #current stats
      push (@batch_sql_traf,"INSERT INTO User_stats_full (timestamp,auth_id,router_id,byte_in,byte_out,pkt_in,pkt_out,step) VALUES($flow_date,'$entry->{auth_id}','$router_id','$entry->{in}','$entry->{out}','$entry->{pkt_in}','$entry->{pkt_out}','$timeshift')");

      #last found timestamp
      push (@batch_sql_traf,"UPDATE User_auth SET `last_found`=$flow_date WHERE id='$entry->{auth_id}'");

      #hour stats
      # get current stats
      my $sql = "SELECT id, byte_in, byte_out FROM User_stats"
              . " WHERE `timestamp`>=$hour_date1 AND `timestamp`<=$hour_date2 AND router_id=$router_id AND auth_id=$entry->{auth_id}";
      my $hour_stat = get_record_sql($dbh,$sql);

      if ($hour_stat) {
          # a row for this hour exists: add the new traffic to it
          my $byte_in  = ($hour_stat->{byte_in}  || 0) + $entry->{in};
          my $byte_out = ($hour_stat->{byte_out} || 0) + $entry->{out};
          push (@batch_sql_traf,"UPDATE User_stats SET byte_in='".$byte_in."', byte_out='".$byte_out."' WHERE id=".$hour_stat->{id});
      }
      else {
          # first record of this hour for the user
          push (@batch_sql_traf,"INSERT INTO User_stats (timestamp,auth_id,router_id,byte_in,byte_out) VALUES($flow_date,'$entry->{auth_id}','$router_id','$entry->{in}','$entry->{out}')");
      }
  }

  # Run the collected statements as one transaction; switching AutoCommit back
  # on commits it (see DBI documentation). Nothing to do for an empty batch.
  if (scalar(@batch_sql_traf)) {
      $dbh->{AutoCommit} = 0;
      foreach my $sSQL (@batch_sql_traf) {
          my $sth = $dbh->prepare($sSQL);
          $sth->execute;
          $sth->finish;
      }
      $dbh->{AutoCommit} = 1;
  }

  db_log_debug($dbh,"Import traffic from router id: $router_id stop") if ($debug);

  db_log_verbose($dbh,"Recalc quotes started");
  recalc_quotes($dbh,$router_id);
  db_log_verbose($dbh,"Recalc quotes stopped");

  # counters that were never touched are reported as 0
  $stats{line}{illegal} ||= 0;
  $stats{pkt}{illegal}  ||= 0;

  # per-second rate; 0 when no time step is configured (avoids division by zero)
  my $per_sec = sub { return $timeshift ? $_[0]/$timeshift : 0; };

  db_log_verbose($dbh,"router id: $router_id stop Traffic statistics, lines: all => $stats{line}{all}, user=> $stats{line}{user}, free => $stats{line}{free}, illegal=> $stats{line}{illegal}");
  db_log_verbose($dbh,sprintf("router id: %d stop Traffic speed, line/s: all => %.2f, user=> %.2f, free => %.2f, unknown=> %.2f", $router_id, $per_sec->($stats{line}{all}), $per_sec->($stats{line}{user}), $per_sec->($stats{line}{free}), $per_sec->($stats{line}{illegal})));
  db_log_verbose($dbh,"router id: $router_id stop Traffic statistics, pkt: all => $stats{pkt}{all}, user_in=> $stats{pkt}{user_in}, user_out=> $stats{pkt}{user_out}, free => $stats{pkt}{free}, illegal=> $stats{pkt}{illegal}");
  db_log_verbose($dbh,sprintf("router id: %d stop Traffic speed, pkt/s: all => %.2f, user_in=> %.2f, user_out=> %.2f, free => %.2f, unknown=> %.2f", $router_id, $per_sec->($stats{pkt}{all}), $per_sec->($stats{pkt}{user_in}), $per_sec->($stats{pkt}{user_out}), $per_sec->($stats{pkt}{free}), $per_sec->($stats{pkt}{illegal})));

  $dbh->disconnect;
  exit 0;