common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	819117	application/xhtml+xml	67.205.3.89	0	0	14	0	0	0	0	0	0	0	0	text/html	27784	html-mf-xfn	1328767358000	14	http://www.chsglobe.com/tag/carolyn-blair/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	951789	application/xhtml+xml	184.172.171.170	0	0	0	0	0	0	0	0	74	0	0	text/html	52523	html-mf-xfn	1328767359000	74	http://robyngough.com/2009/03/17/its-no-blarney-sale/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	1107477	text/html	62.149.195.44	0	0	5	0	0	0	0	0	0	0	0	text/html	45967	html-mf-hcard	1328767360000	5	http://www.palermoanimali.it/ViewProfile-eugenia.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	1597022	application/xhtml+xml	64.14.74.38	0	0	9	0	0	0	0	0	0	0	0	text/html	23109	html-mf-hcard	1328767361000	9	http://cascadebicyclestudio.com/2006/08/seven-test-bikes-for-sale/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	1619856	application/xhtml+xml	184.172.252.137	0	0	6	0	0	0	0	0	0	0	0	text/html	29997	html-mf-hcard	1328767361000	6	http://thebestmusicblog.com/in-this-land/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	2508028	text/html	67.205.37.206	0	0	24	0	0	0	0	0	0	0	4	text/html	36334	html-mf-hcard	1328767387000	28	http://eoid.org/tag/kabab/page/2/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	2896187	application/xhtml+xml	69.195.97.151	0	0	0	0	0	0	0	0	4	0	0	text/html	27124	html-mf-xfn	1328767387000	4	http://www.noahhowell.com/2009/02/why-not-sober-up-in-the-y-not/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	2999134	application/xhtml+xml	208.84.154.17	0	0	0	0	0	0	0	0	0	0	4	text/html	12250	html-rdfa	1328767384000	4	http://www.newcircle.com.au/news/2010/05/marcus-reich-gravity-edit/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	3765008	application/xhtml+xml	77.232.92.12	0	0	0	0	0	0	0	0	174	0	0	text/html	32063	html-mf-xfn	1328767385000	174	http://spxl.tv/2008/09/03/mind-reggae-dubstep/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	4303841	text/html	50.22.90.97	0	0	70	0	0	0	0	0	0	0	0	text/html	34754	html-mf-xfn	1328767384000	70	http://www.thebiblequotes.com/page/16
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	4315637	application/xhtml+xml	63.108.88.105	0	0	0	0	0	0	0	0	0	4	0	text/html	132591	html-microdata	1328767384000	4	http://store.inkjetcarts.us/i-series-c165.aspx
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	4455032	application/xhtml+xml	50.22.66.127	0	0	14	0	0	0	0	0	0	0	0	text/html	49569	html-mf-xfn	1328767384000	14	http://jagonews.com/2010/08/mazhar-majeed-released-on-bail-how-a-reporter-becomes-bookie/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	4654890	application/xhtml+xml	64.87.13.220	0	0	0	0	0	0	0	0	0	0	2	text/html	62258	html-rdfa	1328767384000	2	http://www.ipsb.edu/about-ipsb/our-people/instructors/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	5630618	text/html	216.35.196.77	0	0	28	0	0	0	0	0	0	0	0	text/html	9163	html-mf-xfn	1328767383000	28	http://stephlewis.com/2004/10/man/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	5633563	text/html	66.147.242.173	0	0	0	0	0	0	0	0	0	0	13	text/html	45219	html-rdfa	1328767383000	13	http://jessicamullen.com/2010/06/04/learning-with-lifestreaming-17-lifestreaming-the-law-of-attraction/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	5744230	text/html	89.30.106.44	0	0	0	0	0	0	0	0	0	0	3	text/html	22345	html-rdfa	1328767381000	3	http://www.convention-collective-plasturgie.fr/convention-collective-plasturgie-c292/organisation-duree-temps-travail-t5682141/reduction-duree-travail-formation-s5726473/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	5766754	text/html	50.22.107.97	0	0	7	0	0	0	0	0	0	0	0	text/html	26456	html-mf-xfn	1328767381000	7	http://lowcarbdietplans.low-carb-diet-planner.com/tag/going-low-carb-and-loving-it/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	6557304	application/xhtml+xml	72.167.68.125	0	0	3	0	0	0	0	0	0	0	0	text/html	43279	html-mf-hcard	1328767381000	3	http://www.fireflygn.com/Gold-Luncheon-Napkin-50Ct-GLD50LCNP-PP.htm
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	6881862	application/xhtml+xml	50.23.110.233	0	0	6	0	0	0	0	0	0	0	0	text/html	34509	html-mf-hcard	1328767379000	6	http://www.topratedautoinsurancecompanies.com/tag/car-insurance-comparisons/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	8265636	application/xhtml+xml	202.172.26.8	0	0	0	0	0	0	0	0	4	0	0	text/html	32291	html-mf-xfn	1328767363000	4	http://www.ito-rhythm.com/iphone/448.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	8291802	application/xhtml+xml	174.132.89.99	0	0	6	0	0	0	0	0	0	0	0	text/html	33080	html-mf-hcard	1328767364000	6	http://www.thevirtualasst.com/stickybits-tag-your-world%e2%84%a2
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	8555340	application/xhtml+xml	208.84.154.17	0	0	0	0	0	0	0	0	0	0	3	text/html	38200	html-rdfa	1328767361000	3	http://www.newcircle.com.au/news/category/product-highlight/page/3/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	8598274	application/xhtml+xml	63.108.88.105	0	0	0	0	0	0	0	0	0	4	0	text/html	359000	html-microdata	1328767362000	4	http://store.inkjetcarts.us/pro-9600-c591.aspx
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	10593557	application/xhtml+xml	69.163.136.29	0	0	60	0	0	0	0	0	0	0	0	text/html	52985	html-mf-hcard	1328767361000	60	http://www.parkeoloji.com/catalhoyuklulerin-atalari/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	10668509	text/html	50.22.90.97	0	0	56	0	0	0	0	0	0	0	0	text/html	32477	html-mf-xfn	1328767361000	56	http://www.thebiblequotes.com/page/18
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	10863430	application/xhtml+xml	67.227.133.188	0	0	0	0	0	0	0	0	0	0	8	text/html	32932	html-rdfa	1328767361000	8	http://search.doctoralia.in/oncology/4
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	10891269	text/html	67.205.37.206	0	0	6	0	0	0	0	0	0	0	4	text/html	30365	html-mf-hcard	1328767360000	10	http://eoid.org/tag/lodhi-colony/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	11424817	application/xhtml+xml	64.87.13.220	0	0	0	0	0	0	0	0	0	0	2	text/html	29919	html-rdfa	1328767360000	2	http://www.ipsb.edu/admissions/admissions-eligibility/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	11554168	text/html	89.30.106.44	0	0	0	0	0	0	0	0	0	0	3	text/html	22444	html-rdfa	1328767360000	3	http://www.convention-collective-plasturgie.fr/convention-collective-plasturgie-c292/dispositions-particulieres-personnel-encadrement-t5682060/date-application-s5726306/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	11763799	application/xhtml+xml	173.236.136.14	0	0	0	0	0	0	0	0	0	0	11	text/html	6693	html-rdfa	1328767360000	11	http://www.stacieturnerphotography.com/blog/tag/newborn/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	11855300	text/html	69.163.230.119	0	0	0	0	0	0	0	0	26	0	0	text/html	25831	html-mf-xfn	1328767360000	26	http://seecreatures.com/tag/stella-mccartney/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12018409	application/xhtml+xml	72.167.68.125	0	0	3	0	0	0	0	0	0	0	0	text/html	44993	html-mf-hcard	1328767359000	3	http://www.fireflygn.com/I-Carly-Edible-Icing-Art-EDARICARLY-PP.htm
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12162109	application/xhtml+xml	217.64.195.223	0	0	0	0	0	0	0	0	60	0	0	text/html	27258	html-mf-xfn	1328767366000	60	http://www.sukkology.net/blog/2006/05/23/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12179833	text/html	98.129.229.53	0	0	64	0	0	0	0	0	0	0	0	text/html	67718	html-mf-xfn	1328767382000	64	http://epicbattleaxe.com/rant-gamestopitplease/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12223903	application/xhtml+xml	74.84.203.173	0	0	16	0	0	0	0	0	0	0	1	text/html	85797	html-mf-hcard	1328767373000	17	http://dailyiowegian.com/local/x546122586/Centerville-City-Council-to-meet-tonight
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12255878	text/html	199.204.137.111	0	0	0	0	0	0	0	0	22	0	0	text/html	66936	html-mf-xfn	1328767380000	22	http://www.gilsmethod.com/how-to-unload-unused-dlls-to-regain-memory-in-windows-xp
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12294089	application/xhtml+xml	62.233.114.118	0	0	0	0	0	0	0	0	0	0	6	text/html	62465	html-rdfa	1328767370000	6	http://www.stalbansreview.co.uk/news/2006.0/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12348880	application/xhtml+xml	66.147.242.83	0	0	0	0	0	0	0	0	0	0	1	text/html	37941	html-rdfa	1328767372000	1	http://realblogging.com/stefan-swanepoel/real-estate-industry-update-homeaway-acquires-escapehomes/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12437768	application/xhtml+xml	80.239.169.97	0	0	0	0	0	0	0	0	0	0	1	text/html	53991	html-rdfa	1328767369000	1	http://www.finanzablog.it/user/thesneezer
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	12993089	application/xhtml+xml	97.74.26.1	0	0	0	0	0	0	0	0	4	0	0	text/html	36433	html-mf-xfn	1328767378000	4	http://www.apoliticus.com/2009/04/queen-in-a-bad-mood-tells-berlusconi-to-pipe-down/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13061412	application/xhtml+xml	190.228.29.85	0	0	0	0	0	0	0	0	104	0	0	text/html	74144	html-mf-xfn	1328767359000	104	http://noticiasinformales.com/2008/08/la-lucha-del-acosta-la-lucha-de-todos.html/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13076551	application/xhtml+xml	95.174.24.131	0	0	14	0	0	0	0	0	0	0	0	text/html	38551	html-mf-hcard	1328767361000	14	http://www.casahelp.com/salute-e-benessere/con-il-guerrilla-gardening-il-giardinaggio-diventa-politico/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13158286	application/xhtml+xml	95.174.24.131	0	0	66	0	0	0	0	0	0	0	0	text/html	48097	html-mf-hcard	1328767386000	66	http://www.casahelp.com/gestione-manutenzione/alcuni-suggerimenti-per-togliere-le-macchie/comment-page-1/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13170156	application/xhtml+xml	190.228.29.85	0	0	0	0	0	0	0	0	104	0	0	text/html	89526	html-mf-xfn	1328767387000	104	http://noticiasinformales.com/2008/06/hoy-nos-despertamos-con-la-noticia-de.html/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13273385	application/xhtml+xml	81.169.145.150	0	0	7	0	0	0	0	0	0	0	0	text/html	26435	html-mf-xfn	1328767375000	7	http://www.inmeinerstrasse.de/blog/tag/marzahn/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13280920	application/xhtml+xml	50.56.22.177	0	0	0	0	0	0	0	0	0	0	3	text/html	47376	html-rdfa	1328767377000	3	http://www.bikes.com.au/c/256014/1/2010-radius.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13310853	application/xhtml+xml	194.9.95.116	0	0	37	0	0	0	0	0	0	0	0	text/html	93879	html-mf-hcard	1328767382000	37	http://elingrelsson.se/2009/03/28/man-kan-inte-valdtas/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13328447	text/html	68.233.241.127	0	0	14	0	0	0	0	0	0	0	0	text/html	40674	html-mf-xfn	1328767368000	14	http://ponselhandphone.com/tag/ponsel-chatting/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13374634	application/xhtml+xml	74.220.215.215	0	0	0	0	0	0	0	0	0	0	5	text/html	23896	html-rdfa	1328767380000	5	http://www.hopelesslyflawed.com/tag/mint-julep/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13506907	application/xhtml+xml	184.168.176.1	0	0	63	0	0	0	0	0	0	0	0	text/html	91292	html-mf-hcard	1328767365000	63	http://vremeigre.com/3d-cestitka-sa-srcima.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13960025	text/html	98.129.178.208	0	0	90	0	0	0	0	0	0	0	0	text/html	49551	html-mf-hcard	1328767377000	90	http://www.bignickel-sparkstribune.com/view/full_story/8850649/article-Former-Nev--Gov--Guinn-dead-in-Las-Vegas
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	13984443	application/xhtml+xml	69.89.27.238	0	0	30	0	0	0	0	0	0	0	0	text/html	90024	html-mf-hcard	1328767385000	30	http://monikamcgillicuddy.com/wordpress/tag/atkinson-nh-market-report/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	14555987	text/html	173.245.60.82	0	0	0	0	0	0	0	0	0	0	6	text/html	53034	html-rdfa	1328767374000	6	http://www.justofficechairs.com/commercial-buyer-program/32-gallon-square-receptacle
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	15108047	application/xhtml+xml	66.147.242.85	0	0	91	0	0	0	0	0	0	0	0	text/html	72920	html-mf-hcard	1328767375000	91	http://blog.muscle-build.com/45988/special-school-bodybuilding-material/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	15166896	text/html	97.74.141.1	0	0	7	0	0	0	0	0	0	0	6	text/html	30234	html-mf-xfn	1328767385000	13	http://poponandon.com/tag/andy-carr-show
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	15337058	application/xhtml+xml	199.204.248.106	0	0	0	0	0	0	0	0	0	0	7	text/html	51023	html-rdfa	1328767364000	7	http://www.nauinet.co.jp/blog2/archives/1998/05/post-2.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	15458596	text/html	184.172.213.138	0	0	0	0	0	0	0	0	0	0	67	text/html	208183	html-rdfa	1328767367000	67	http://www.aedrx.info/philips-onsite-aed-defibrillator-quick-order-package/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	15543860	text/html	69.89.31.181	0	0	0	0	0	0	0	0	14	0	0	text/html	46387	html-mf-xfn	1328767374000	14	http://donkeywest.com/2010/06/19/the-independence-of-love/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	15666160	application/xhtml+xml	199.204.248.106	0	0	0	0	0	0	0	0	0	0	7	text/html	28049	html-rdfa	1328767386000	7	http://www.nauinet.co.jp/blog2/archives/2007/09/2007-4.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16024219	text/html	94.124.197.56	0	0	0	0	0	0	0	0	0	0	10	text/html	107667	html-rdfa	1328767365000	10	http://www.themoscowtimes.com/news/article/soviet-political-cartoonist-yefimov-dead-at-108/371385.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16052154	application/xhtml+xml	97.74.180.128	0	0	175	0	0	0	0	0	0	0	0	text/html	55521	html-mf-hcard	1328767369000	175	http://www.mobilewirelessphone.com/2010/02/06/nokia-photo-browser-beta-labs/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16129270	application/xhtml+xml	94.228.36.2	0	0	10	0	0	0	0	0	0	0	0	text/html	53886	html-mf-hcard	1328767374000	10	http://www.touchliverpool.com/business/list/bid/4747361
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16238345	application/xhtml+xml	164.109.40.120	0	0	0	0	0	0	0	0	0	0	7	text/html	89117	html-rdfa	1328767366000	7	http://www.gomemphis.com/news/2009/nov/06/no-headline---2009-11-05-095820482508/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16282558	application/xhtml+xml	141.242.248.222	0	0	0	0	0	0	0	0	0	0	7	text/html	48341	html-rdfa	1328767372000	7	http://www.valleymorningstar.com/articles/donna-66380-funerals-january.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16356114	application/xhtml+xml	173.201.39.183	0	0	0	0	0	0	0	0	0	0	5	text/html	47970	html-mf-xfn	1328767373000	5	http://iamkoream.com/gotv/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16445967	application/xhtml+xml	205.139.40.93	0	0	10	0	0	0	0	0	0	0	0	text/html	54258	html-mf-hcard	1328767368000	10	http://www.vaildaily.com/article/20041230/NEWS/112300012
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16488161	application/xhtml+xml	63.240.213.244	0	0	16	0	0	0	0	0	0	0	7	text/html	64549	html-mf-hcard	1328767359000	23	http://www.kiowacountysignal.com/obituaries/x1517281790/Becklund-memorial-service-set-for-Friday-in-Pratt
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	16550109	application/xhtml+xml	84.45.105.136	0	0	11	0	0	0	0	0	0	0	0	text/html	52324	html-mf-hcard	1328767375000	11	http://www.touchhereford.com/business/list/bid/2269146
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17093818	text/html	208.82.16.68	0	0	30	0	0	0	0	0	0	0	0	text/html	76799	html-mf-hcard	1328767408000	30	http://www.thenetworkonline.org/profile/SusanYoung
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17145942	application/xhtml+xml	98.136.92.79	0	0	0	0	0	0	0	0	6	0	0	text/html	37758	html-mf-xfn	1328767390000	6	http://www.rashtrakut.com/blog/2009/11/08/spreading-creationism-abroad/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17157324	application/xhtml+xml	98.136.92.79	0	0	0	0	0	0	0	0	6	0	0	text/html	34243	html-mf-xfn	1328767415000	6	http://www.rashtrakut.com/blog/2009/12/04/literally-from-rags-to-riches/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17226378	text/html	76.74.255.123	0	0	0	0	0	0	0	0	138	0	0	text/html	73791	html-mf-xfn	1328767410000	138	http://banannery.com/tag/satire/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17244808	application/xhtml+xml	74.200.243.251	0	0	216	0	0	0	0	0	0	0	0	text/html	78503	html-mf-hcard	1328767401000	216	http://penguingeneration.com/2010/08/08/most-comments-in-a-week-award/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17262507	application/xhtml+xml	76.74.255.123	0	0	0	0	0	0	0	0	34	0	0	text/html	30781	html-mf-xfn	1328767390000	34	http://icanhazdot.net/tag/teched/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17272607	application/xhtml+xml	76.74.255.123	0	0	0	0	0	0	0	0	34	0	0	text/html	32352	html-mf-xfn	1328767413000	34	http://icanhazdot.net/2008/10/24/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17303221	application/xhtml+xml	12.228.94.216	0	0	0	0	0	0	0	0	0	62	1	text/html	36573	html-microdata	1328767399000	63	http://www.mobilealflorist.com/gift-baskets
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17400363	text/html	213.186.33.16	0	0	0	0	0	0	0	0	0	0	1	text/html	58814	html-rdfa	1328767408000	1	http://www.sinart.asso.fr/3-films-avec-bud-spencer-et-terence-hill-coffret-3-dvd-13215
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17881341	text/html	208.65.158.3	0	0	0	0	0	0	0	0	0	11	0	text/html	42060	html-microdata	1328767395000	11	http://www.condosatwilliamscentre.com/44/Condominium-at-Williams-Centre-Blog/New-Available-Unit-Unit-10305-has-become-available/New-Available-Unit-Unit-16306-has-become-available
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	17956468	text/html	64.42.222.57	0	0	0	0	0	0	0	0	0	20	0	text/html	55105	html-microdata	1328767415000	20	http://sdhomepro.com/mylistings.html/details-9586207
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	18125499	application/xhtml+xml	72.233.2.58	0	0	0	0	0	0	0	0	18	0	0	text/html	52288	html-mf-xfn	1328767396000	18	http://mundoepm.com.br/2009/11/20/videos-da-project-conference-2009/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	18138595	application/xhtml+xml	76.74.254.120	0	0	0	0	0	0	0	0	18	0	0	text/html	55622	html-mf-xfn	1328767416000	18	http://mundoepm.com.br/2009/09/24/fotos-da-project-conference-2009-2/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	20496683	application/xhtml+xml	202.181.99.36	0	0	7	0	0	0	0	0	0	0	0	text/html	28646	html-mf-hcard	1328767417000	7	http://www.hotstudio.net/serika/blog/2009/12/divinity-2-ego-draconis-part1.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	20503331	application/xhtml+xml	184.173.2.186	0	0	0	0	0	0	0	0	0	0	5	text/html	40724	html-rdfa	1328767418000	5	http://www.shreveportrealestateandhomes.com/pending-home-sales-rise-unexpectedly/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	20520723	application/xhtml+xml	65.254.248.134	0	0	56	0	0	0	0	0	4	0	0	text/html	167263	html-mf-xfn	1328767418000	60	http://thekingdomkey.net/forums/user/696-miss-ninja/page__tab__aboutme
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	20788054	application/xhtml+xml	66.228.131.228	0	0	6	0	0	0	0	0	0	0	0	text/html	24871	html-mf-hcard	1328767416000	6	http://www.gloriousfootball.com/tag/bocanegra/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	20813041	application/xhtml+xml	209.236.73.165	0	0	6	0	0	0	0	0	0	0	0	text/html	16792	html-mf-hcard	1328767416000	6	http://www.alexlcohen.com/tag/iphone-analytics/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	21291375	application/xhtml+xml	184.154.228.18	0	0	36	0	0	0	0	0	0	0	0	text/html	64204	html-mf-hcard	1328767417000	36	http://natasha.edcentric.org/2009/12/27/happy-holidays/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	21397202	application/xhtml+xml	67.192.126.212	0	0	0	0	0	0	0	0	8	0	0	text/html	26176	html-mf-xfn	1328767417000	8	http://blog.canvaspress.com/tag/canvas-art/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	21416035	text/html	69.163.243.254	0	0	7	0	0	0	0	0	0	0	0	text/html	12803	html-mf-xfn	1328767417000	7	http://www.darkmessiah.com/assassins-creed-iafricacom/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	21848252	application/xhtml+xml	74.50.0.35	0	0	21	0	0	0	0	0	0	0	0	text/html	26478	html-mf-hcard	1328767417000	21	http://www.asiahealthtourism.com/case-studies-following-on-from-truth-telling-question/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	21966175	application/xhtml+xml	50.18.59.48	0	0	0	0	0	0	0	0	0	0	6	text/html	23062	html-rdfa	1328767415000	6	http://www.philadelphiaflowers.net/p3/3447/Grand_Celebrations_Fruit_and_Wine_Basket-1.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	22751446	application/xhtml+xml	118.127.87.28	0	0	0	0	0	0	0	0	0	0	2	text/html	40962	html-rdfa	1328767415000	2	http://www.oasis.com/de/member/vakerox.htm
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25162794	application/xhtml+xml	174.120.83.157	0	0	0	0	0	0	0	0	0	0	2	text/html	95698	html-mf-hreview	1328767412000	2	http://ipranayam.com/gasacidity-and-constipation/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25312902	text/html	217.6.129.104	0	0	0	0	0	0	0	0	0	0	3	text/html	38038	html-rdfa	1328767412000	3	http://www.emsland-touristik.de/Ab_aufs_Rad-94-2579-1.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25330674	text/html	193.203.205.226	0	0	5	0	0	0	0	0	0	0	0	text/html	42362	html-mf-hcard	1328767412000	5	http://fitclub.ro/antrenament-culturism-fitness/exercitii-culturism-fitness/fese/fandari-haltera
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25389185	text/html	174.132.195.34	0	0	0	0	0	0	0	0	6	0	0	text/html	59673	html-mf-xfn	1328767412000	6	http://wsmarketingnews.com/tag/google-adwords/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25479602	application/xhtml+xml	184.173.193.157	0	0	70	0	0	0	0	0	4	0	0	text/html	32107	html-mf-xfn	1328767410000	74	http://www.peterdorsi.com/category/general/page/10/
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25571937	application/xhtml+xml	173.248.188.79	0	0	0	0	0	0	0	0	0	0	3	text/html	60112	html-rdfa	1328767410000	3	http://www.platinumlist.ae/gallery/item/273/DJ_Magazine_Party_feat_AMIN_GOLESTAN_AFROBOOGIE.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25621473	application/xhtml+xml	212.36.82.32	0	0	0	0	0	0	0	0	40	0	0	text/html	27430	html-mf-xfn	1328767410000	40	http://www.netdancerplanet.info/2007/01/guapas-pixeladas.html
common-crawl/parse-output/segment/1346823845675/1346864466526_10.arc.gz	25656249	application/xhtml+xml	113.33.195.32	0	0	0	0	0	0	0	0	0	0	5	text/html	27807	html-rdfa	1328767411000	5	http://brushcutter.shop-niche.co.jp/2010/05/post-65d5.html
