make.bad_link.pages 3.55 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89
#!/bin/sh
# Build the per-section "bad link" pages from the URL-check logs.
#
# Usage: make.bad_link.pages [YYYYMMDD]
#
# For each section log logs/web.<date><suffix> this runs ./prune.pl and saves
# its output as logs/web.<date><suffix>.bad.  Then, for every location of
# that section, ./bad_pages.pl writes $topdir/<loc> and ./extract_lang.pl
# writes $topdir/<loc>.en.
#
# All helper scripts and the logs/ directory are referenced with relative
# paths, so the script has to be started from the directory containing them.
# Processing is best-effort: a failure in one section does not stop the
# following sections.

# Date stamp of the logs to process; defaults to today.
date=${1:-$(date +%Y%m%d)}
topdir=/srv/www-master.debian.org/htdocs/build-logs/urlcheck
mkdir -p "$topdir"

# check_section SUFFIX LOC...
#
# Prune logs/web.$date$SUFFIX into logs/web.$date$SUFFIX.bad, then generate
# the page and its English extract for every LOC.
#   SUFFIX  log suffix including the leading dot (e.g. ".rel"), or '' for
#           the main log
#   LOC...  locations to report on, relative to $topdir
# Reads the globals $date and $topdir.  Returns the exit status of the last
# command that was run.
check_section() {
	log="logs/web.$date$1"
	shift
	./prune.pl "$log" > "$log.bad"
	for loc in "$@" ; do
		# Locations such as releases/stable need their parent directory
		# below $topdir before the output redirection can succeed.
		case $loc in
			*/*) mkdir -p "$topdir/${loc%/*}" ;;
		esac
		./bad_pages.pl "$loc" < "$log.bad" > "$topdir/$loc"
		./extract_lang.pl en "$topdir/$loc" > "$topdir/$loc.en"
	done
}

check_section '' \
	MailingLists banners Bugs consultants events intro legal logos mirror \
	misc partners volatile vote y2k other

# Disabled, see note in run.urlcheck
# check_section .sec \
# 	security/1997 security/1998 security/1999 security/2000 security/2001 \
# 	security/2002 security/2003 security/2004 security/2005 security/2006 \
# 	security/2007 security/2008 security/2009 security/2010 security/2011 \
# 	security/undated

check_section .rel \
	releases/stable releases/testing releases/unstable \
	releases/slink releases/potato releases/woody releases/sarge \
	releases/etch releases/lenny \
	releases/2.1 releases/2.2 releases/3.0 releases/3.1 releases/4.0 \
	releases/5.0

check_section .cd CD
check_section .devel devel
check_section .distrib distrib
check_section .doc doc
check_section .intl international
check_section .users users

check_section .news \
	News/1998 News/1999 News/2000 News/2001 News/2002 News/2003 News/2004 \
	News/2005 News/2006 News/2007 News/2008 News/2009 News/2010 News/2011 \
	News/weekly

# Each port is listed exactly once; running a location twice only rewrites
# the same output files.
check_section .ports \
	ports/alpha ports/arm ports/amd64 ports/beowulf ports/freebsd \
	ports/hppa ports/hurd ports/i386 ports/ia64 ports/kfreebsd-gnu \
	ports/m68k ports/mips ports/netbsd ports/powerpc ports/s390 \
	ports/sparc ports/sparc64