Skip to content
This repository has been archived by the owner on Sep 26, 2024. It is now read-only.

Commit

Permalink
scrape.pl: make scraper sucks less.
Browse files Browse the repository at this point in the history
  • Loading branch information
KARBOWSKI Piotr committed Jan 21, 2017
1 parent 4e6cdbb commit 3fb9468
Showing 1 changed file with 89 additions and 31 deletions.
120 changes: 89 additions & 31 deletions scrape.pl
Original file line number Diff line number Diff line change
@@ -1,37 +1,95 @@
#!/usr/bin/perl
#!/usr/bin/env perl

use warnings;
use strict;
use XML::Simple;
use LWP::Simple 'get', 'getstore';
use File::Basename 'dirname', 'basename';
use Cwd 'abs_path';

my $script_dir = abs_path(dirname(__FILE__));
chdir($script_dir);
my $feed_raw = get("http://grsecurity.net/testing_rss.php");

my $feed = XMLin($feed_raw, ForceArray => ['item']);
my $filename;
my $link;
my $new_patches;

for(@{$feed->{channel}->{item}}) {
$link = $_->{link};
$filename = basename($link);
if ( ! -e $script_dir . "/test/". $filename ) {
$new_patches++;
print("Downloading ", $filename, " ...\n");
getstore($link . ".sig", $script_dir . "/test/" . $filename . ".sig");
getstore($link, $script_dir . "/test/" . $filename);
}
use autodie qw / :all /;
use LWP::UserAgent;
use File::Basename qw/ fileparse /;
use File::Path qw/ rmtree /;

sub einfo {
printf( "[INFO] >>> %s\n", join( ' ', @_ ) );
}

sub fetch {
my ( $url, $save_to ) = @_;

my $ua = LWP::UserAgent->new;

einfo( "Fetching $url ..." );

my $response = $ua->get( $url, 'Accept-Encoding' => 'gzip' );

if ( $response->is_success ) {
if ( $save_to ) {
open( my $file, '>', $save_to );

my $content = $response->decoded_content;

if ( utf8::is_utf8( $content ) ) {
binmode( $file,':utf8' );
} else {
binmode( $file,':raw' );
}

print $file $content;
close( $file );
return 1;
} else {
return $response->decoded_content;
}
} else {
die "Fetch failed.\n";
}
}

my $script_dir = ( fileparse( __FILE__ ) )[1];
chdir( $script_dir );

my $latest_patch = fetch( 'https://grsecurity.net/latest_test_patch' );
chomp( $latest_patch );
einfo "Latest patch $latest_patch";

my ( $grsec_major_version, $kernel_version, $grsec_patch_version ) = ( $latest_patch =~ m/^grsecurity-([0-9.]+)-([0-9.]+)-([0-9]+)\.patch$/ );

for my $var ( $grsec_major_version, $kernel_version, $grsec_patch_version ) {
die "Wrong patch file name?\n" unless defined( $var ) and length $var;
}
if ($new_patches) {
print("Downloading changelog-test.txt ...\n");
getstore("http://grsecurity.net/changelog-test.txt", $script_dir . "/test/changelog-test.txt");

system("git", "add", $script_dir . "/test/" . $filename, $script_dir . "/test/changelog-test.txt", $script_dir . "/test/" . $filename . ".sig");
system("git", "commit", "-a", "-m", "Auto commit, " . $new_patches . " new patch{es}.");
system("git", "push");

if ( -f "test/$kernel_version/$latest_patch" ) {
einfo "Already downloaded.";
exit 0;
}

if ( -d 'tmp' ) {
rmtree( 'tmp' );
}
mkdir( 'tmp' );

fetch( "https://grsecurity.net/test/$latest_patch", "tmp/$latest_patch" );
fetch( "https://grsecurity.net/test/$latest_patch.sig", "tmp/$latest_patch.sig" );
fetch( 'https://grsecurity.net/changelog-test.txt', 'tmp/changelog-test.txt' );

mkdir( "test/$kernel_version" ) if not ( -d "test/$kernel_version" );
rename( "tmp/$latest_patch", "test/$kernel_version/$latest_patch" );
rename( "tmp/$latest_patch.sig", "test/$kernel_version/$latest_patch.sig" );
rename( 'tmp/changelog-test.txt', 'test/changelog-test.txt' );

einfo 'git add ..,';
system(
"git", "add",
"test/$kernel_version/$latest_patch",
"test/$kernel_version/$latest_patch.sig",
'test/changelog-test.txt'
);

einfo 'git commit ...';
system(
"git", "commit", "-m", "Auto commit, $latest_patch added.",
"test/$kernel_version/$latest_patch",
"test/$kernel_version/$latest_patch.sig",
'test/changelog-test.txt'
);

einfo 'git push ...';
#system("git", "push");

0 comments on commit 3fb9468

Please sign in to comment.