Data Audit

/0

 * 3.9G   a -- Looks like old junk; can we get rid of it?
 * 21M    backup
 * 21M    backup.madmappers.20060411.database.sql.gz
 * 1.9G   backup.pinky_worldwindcentral_net.20060301.0.usr.dump -- Do we need this ungzipped copy, or need it at all?
 * 567M   backup.pinky_worldwindcentral_net.20060301.0.usr.dump.gz.aes
 * 142G   datasets
 * 434M   bmng.topo.bathy.200401 -- Why is BMNG sitting in here not being used?
 * 432M   bmng.topo.bathy.200402
 * 430M   bmng.topo.bathy.200403
 * 428M   bmng.topo.bathy.200404
 * 426M   bmng.topo.bathy.200405
 * 429M   bmng.topo.bathy.200406
 * 420M   bmng.topo.bathy.200407
 * 419M   bmng.topo.bathy.200408
 * 434M   bmng.topo.bathy.200409
 * 435M   bmng.topo.bathy.200410
 * 441M   bmng.topo.bathy.200411
 * 437M   bmng.topo.bathy.200412
 * 7.9G   hurricane_katrina
 * 43G    hurricane_katrina.ace
 * 1.8G   hurricane_ophelia.noaa
 * 4.5G   hurricane_rita.noaa
 * 137M   ri
 * 147M   RobbenIsland
 * 80G    us.westvirginia_wvsamb2003_0.6m
 * 775M   geocoder  -- Again, not being used?
 * 4.0K   bench
 * 4.0K   geocode_benchmark.pl
 * 4.0K   geocode_cli.pl
 * 4.0K   list.txt
 * 4.0K   resp.txt
 * 4.0K   test.php
 * 775M   tiger2004.db
 * 246M   linux-2.6.15.5
 * Various files
 * 39M    linux-2.6.15.5.tar.bz2
 * 1.5G   log -- Why don't we offload these somewhere, as they're just old logs?
 * 1.3G   www
 * 148M   www_wwc_lighttpd
 * 31G    nrcs  -- I assume these are waiting to be processed?
 * Various imagery files
 * 12G    work  -- Lots of stuff in here; didn't bother going through it
 * Various files (Nowak's?)

/1

 * 12G    africa250k -- Madmappers Africa250k
 * 22G    a.tar -- Looks like old files from pinky, deletable?
 * 49M    aw -- AWstats files
 * 1.5G   b.tar -- Looks like old files from pinky, deletable?
 * 34G    cachepacks -- WWD Cache packs
 * 1.5G   c.tar -- Looks like old files from pinky, deletable?
 * 1.5G   data -- Seems to be a redundant copy of /0/log; same issue.
 * 134G   datasets
 * 14G    us.alabama.birmingham_mar2002_seamless23002hz
 * 6.4G   us.alaska.anchorage_sep2002_seamless22102hz
 * 2.2G   us.florida.pasco
 * 4.8G   us.idaho.boise_apr2003_seamless23202hz
 * 9.2G   us.louisiana.batonrouge_mar2002_seamless22902hz
 * 2.1G   us.maine.augusta_mar2003_seamless22402hz
 * 8.8G   us.maryland.baltimore-annapolis_oct2002-jan2003_seamless22702hz
 * 4.2G   us.nevada.carsoncity_jul2003_seamless23702hz
 * 11G    us.nevada.lasvegas-mesquite_sep2003_seamless22402hz
 * 13G    us.newmexico.albuquerque_mar2002_seamless21802hz
 * 20G    us.newmexico.albuquerque_mar2004_seamless21a02hz
 * 24G    us.northcarolina.greensboro-winstonsalem_mar2002_seamless26402hz
 * 8.9G   us.ohio.cincinnati_jun2003_seamless24402hz
 * 963M   us.pennsylvania.allentown-bethlehem_feb-apr2002_seamless21902hz
 * 3.6G   us.texas.amarillo_apr2002_seamless22002hz
 * 4.2G   us.texas.austin_apr2002_seamless22502hz


 * 459M   d.tar -- Looks like old files from pinky, deletable?
 * 35M    e.tar -- Looks like old files from pinky, deletable?
 * 35M    root -- Looks like old files from pinky, deletable?
 * 470M   tiles
 * 473M   usr -- backup?
 * 1.5G   var -- backup?
 * 14G    work -- Clean / deletable?
 * Various files
 * 6.8G   www -- Looks like old files from pinky, deletable?
 * 560M   www_wwc -- Looks like old files from pinky, deletable?
 * 8.0K   www_wwc_chatcgi -- Looks like old files from pinky, deletable?

/home

 * 12K    adolph_ne.aux
 * 4.0K   adolph_ne.sdw
 * 20M    adolph_ne.sid
 * 13M    adolph_ne.tif
 * 4.0K   adolph_ne.txt
 * 20M    adolph_ne.zip
 * 1.8G   backup
 * 1011M  bbcclimate
 * 3.5M   bbcclimate.sh
 * 31M    bluefield.zip
 * 23G    datasets
 * 2.7M   au.westaustralia_grav2004
 * 33M    au.westaustralia_mag2005
 * 1.1G   au.westaustralia_topo
 * 281M   bmng.topo.bathy.200401
 * 455M   bmng.topo.bathy.200401_merchq
 * 0      bmng.topo.bathy.200401_merclq
 * 2.0M   coverage
 * 3.2G   landsat
 * 448M   nz_linz1994_2.5m
 * 1.9G   nz_linz1995_2.5m
 * 1.2G   nz_linz1996_2.5m
 * 164M   nz_linz1997_2.5m
 * 1.6G   nz_linz1998_2.5m
 * 1.4G   nz_linz1999_2.5m
 * 3.8G   nz_linz2000_2.5m
 * 1.9G   nz_linz2001_2.5m
 * 2.5G   nz_linz2002_2.5m
 * 1.3G   nz_linz2003_2.5m
 * 1.3G   nz_linz2004_2.5m
 * 28M    test
 * 1.7M   test2


 * 3.3M   fairmont_east.zip
 * 434M   forum
 * 0      ftp
 * 775M   geocoder
 * 54M    geoserver
 * 30M    geoserver-1.3.0a-src.zip
 * 1.3G   haw
 * 12K    llynix
 * 8.0K   mapserv
 * 12K    maurizio
 * 19G    mwilkie
 * 1.2G   mysql
 * 12K    nosilleg
 * 3.9G   nowak
 * 0      rails
 * 987M   root
 * 0      srtm
 * 17M    test2
 * 14M    torrent
 * 12K    user
 * 124G   work
 * 5.9M   wvgeol.zip
 * 20G    www
 * 12K    yeogeoorg

/0

 * 2.1G   au.westaustralia_geology_250k
 * 4.0K   config.php
 * 36M    test -- Test dataset of some sort?
 * 37G    us.florida_2004_1m
 * 23G    us.indiana_naip2003_1m
 * 38G    us.massachusetts_massgis2001_0.5m
 * 14G    us.montana_nsdi2004_0.3m
 * 9.3G   us.newyork_nysdop2001_0.3m
 * 12G    us.newyork_nysdop2002_0.3m
 * 21G    us.newyork_nysdop2003_0.3m
 * 31G    us.newyork_nysdop2004_0.15m
 * 26G    us.newyork_nysdop2004_0.3m
 * 2.4G   us.newyork_nysdop2004_0.6m
 * 137M   za.robbenisland_0.5m

/1

 * 399M 0.es_1990_jpg -- We can probably remove this if we need space; it is a layer copy from nlt
 * 502M 0.nlt_pseudo -- (see 0.es_1990_jpg)
 * 1.6G 1.es_1990_jpg -- (see 0.es_1990_jpg)
 * 1.8G 1.nlt_pseudo -- (see 0.es_1990_jpg)
 * 6.3G 2.es_1990_jpg -- (see 0.es_1990_jpg)
 * 6.7G 2.nlt_pseudo -- (see 0.es_1990_jpg)
 * 746M aptcache -- /var/cache/apt was maxing out /var, so it was moved here
 * 54G cachepacks -- WWD Cache packs, needs to be cleaned
 * 172M eogeo -- Can be removed, we no longer host eogeo.
 * 21G mwilkie -- Original upload of CDEM
 * 7.5G worldwind28.arc.nasa.gov -- Copy of BMNG from worldwind28
 * 4.0K wwcbackup

/2

 * 24G 3.es_1990_jpg
 * 84G 4.es_1990_jpg
 * 2.2G ftcoll
 * 2.1G ftcoll.tar
 * 100M layers
 * 6.5G log
 * 68G sa50k
 * 0 tmp
 * 810M va-naip-partial
 * 170M world.200401.3x21600x21600.A1.png
 * 34G wwc_backup_fromt1

Storage1
(Note: This server is owned by Matt Mills, anything marked "Personal" is his.)

/store

 * 22G    backup -- Personal
 * 12G    backups -- Personal
 * 24G    bmng -- Tiled BMNG that's used in WW + Cache packs
 * 33M    boinc -- BOINC files
 * 92M    cache
 * 309M   cachescripts
 * 4.6M   cisco -- Personal
 * 12G    clementine30xx -- Clementine data that's used in WW + Cache packs
 * 191G   cluster -- Files the cluster uses for booting.
 * 8.0K   alloctest
 * 4.0K   alloctest.c
 * 4.0K   build_initrd
 * 64K    dev.tar.gz
 * 187G   home -- Can we clean this up at all? Lots of data that's doing nothing at the moment.
 * 488M   boinc
 * 605K   dnetc496-linux-x86-elf-uclibc
 * 2.1G   done
 * 137G   processing
 * 49G    srcData
 * 0      tmp
 * 91M    initrd
 * 375M   NewYork
 * 256M   packages
 * 2.6G   root
 * 128M   root.tar


 * 28K    convert -- tiling script (no longer in use)
 * 3.8G   diskbackups -- Personal
 * 0      dstmp
 * 37G    fl -- Tiles of somewhere in Florida; can we rm this?
 * 4.6G   garbuttny -- Historic maps that Nelson was going to process
 * 12G    geocover2000 -- Geocover2000 data that's used in WW + Cache packs
 * 2.5G   imagery -- Imagery I've bought (two counties in FL)
 * 6.3G   JHB_Ortho_Proces -- Johannesburg Orthophotos from Maurizio
 * 143M   log-nlt-cluster-usage.zip -- Log Jessi sent me a while back for testing
 * 28K    master -- see "convert"
 * 441K   maurizio
 * 28G    mwilkie -- CDEMs
 * 53M    mysql
 * 60G    nasa1 -- Backup of some data on nasa1.us.archive.org
 * 168K   ncd -- Personal
 * 372G   nlt
 * 536G   seamless
 * 613K   sig -- Personal
 * 90G    srtm -- SRTM3arcsecv2, srtm30plus, usgsNED
 * 61G    Storage -- Personal
 * 3.6G   swazi -- Swaziland orthophotos from Maurizio
 * 449M   temp
 * 4.3G   tiger -- Tiger/LINE 2004 data
 * 5.0M   tivo -- Personal
 * 1.5G   wa -- West Australia data (can probably delete?)
 * 11G    wa-topo -- West Australia data (can probably delete?)
 * 8.0K   wms.php
 * 20M    wrobben -- wrobben isle data from Maurizio

/data/0

 * 6.3G   backup
 * 150G   ca
 * 2.0G   calif
 * 6.3G   johannesburg
 * 14G    nrcs
 * 180G   ny
 * 69G    ny2
 * 21G    ny3
 * 1.1M   ny4
 * 4.0K   process
 * 4.0K   process_mrsid
 * 257M   root2.img
 * 0      rst0
 * 4.0K   seamless_22202HZ
 * 799M   seamless_23302HZ
 * 0      seamless_24002HZ
 * 57G    seamless_24102HZ
 * 560M   seamless_24302HZ
 * 56G    seamless_24402HZ
 * 54G    seamless_24502HZ
 * 31G    seamless_24602HZ
 * 26G    seamless_OCL02HZ
 * 14G    seamless_OCM02HZ
 * 0      source
 * 38G    storage1transfer
 * 148M   tivobackup
 * 0      tpk
 * 7.1G   vt

/data/1

 * 4.0K   compress
 * 1.1G   img
 * 4.0K   prepare_seamless
 * 4.0K   process
 * 4.0K   process2
 * 162G   seamless_21A02HZ -- processed seamless data, waiting to be tpk'd (?)
 * 1.1G   watopo  -- Attempt to convert from Nowak's tile format to wwcache
 * 1.1G   watopo_wwcache -- See above (watopo)