aboutsummaryrefslogtreecommitdiffstats
path: root/test/group.yaml
diff options
context:
space:
mode:
author: Matěj Cepl <mcepl@redhat.com> 2014-01-02 16:48:57 +0100
committer: Matěj Cepl <mcepl@redhat.com> 2014-01-02 16:48:57 +0100
commit: 80f10eaaf784db7c0dfa04ed8917f98aac60eff0 (patch)
tree: 06c4351c0b53bb795925ca9db5d2fa3673663582 /test/group.yaml
parent: 4b3df4fabb92dab4028cb794de897eaf3b8fde82 (diff)
download: gg_scraper-80f10eaaf784db7c0dfa04ed8917f98aac60eff0.tar.gz
For each group, also generate a list of all mangled addresses.
Google Groups (rightly) protects addresses against spammers. There is (obviously) no way to recover the true values of these addresses programmatically, so we just generate a list of all affected ones, which can later be completed with the true values (collected somehow) and fixed by some other script. Fixes #275
Diffstat (limited to 'test/group.yaml')
-rw-r--r-- test/group.yaml 12
1 files changed, 6 insertions, 6 deletions
diff --git a/test/group.yaml b/test/group.yaml
index 44cac25..59a33d4 100644
--- a/test/group.yaml
+++ b/test/group.yaml
@@ -5,7 +5,7 @@ topics:
- !!python/object:gg_scrapper.Topic
articles:
- !!python/object:gg_scrapper.Article {raw_message: "From scho...@schovi.cz Thu Jan\
- \ 2 15:15:33 2014\nReceived: by 10.224.192.193 with SMTP id dr1mr1092656qab.9.1306595926917;\n\
+ \ 2 16:12:04 2014\nReceived: by 10.224.192.193 with SMTP id dr1mr1092656qab.9.1306595926917;\n\
\ Sat, 28 May 2011 08:18:46 -0700 (PDT)\nX-BeenThere: javascriptcz@googlegroups.com\n\
Received: by 10.224.187.145 with SMTP id cw17ls698645qab.2.gmail; Sat, 28 May\n\
\ 2011 08:18:45 -0700 (PDT)\nMIME-Version: 1.0\nReceived: by 10.224.205.130\
@@ -26,7 +26,7 @@ topics:
- !!python/object:gg_scrapper.Topic
articles:
- !!python/object:gg_scrapper.Article {raw_message: "From richte...@gmail.com Thu\
- \ Jan 2 15:15:35 2014\nReceived: by 10.224.136.200 with SMTP id s8mr198006qat.21.1306398867334;\n\
+ \ Jan 2 16:12:06 2014\nReceived: by 10.224.136.200 with SMTP id s8mr198006qat.21.1306398867334;\n\
\ Thu, 26 May 2011 01:34:27 -0700 (PDT)\nX-BeenThere: javascriptcz@googlegroups.com\n\
Received: by 10.224.187.145 with SMTP id cw17ls261575qab.2.gmail; Thu, 26 May\n\
\ 2011 01:34:26 -0700 (PDT)\nMIME-Version: 1.0\nReceived: by 10.224.32.129 with\
@@ -47,7 +47,7 @@ topics:
\ v=B9echny stejn=EC (hnusn=EC) a bylo to t=EC=BEkop=E1dn=\n=FD.\n\nhttp://blog.sproutcore.com/announcing-sproutcore-2-0/\n\
\n", root: 'https://groups.google.com/forum/message/raw?msg=javascriptcz/-4cy0XTGGaU/pUoGBDjK_HcJ'}
- !!python/object:gg_scrapper.Article {raw_message: "From damn...@gmail.com Thu Jan\
- \ 2 15:15:36 2014\nReceived: by 10.100.168.2 with SMTP id q2mr1217945ane.14.1306495789592;\n\
+ \ 2 16:12:07 2014\nReceived: by 10.100.168.2 with SMTP id q2mr1217945ane.14.1306495789592;\n\
\ Fri, 27 May 2011 04:29:49 -0700 (PDT)\nX-BeenThere: javascriptcz@googlegroups.com\n\
Received: by 10.90.58.22 with SMTP id g22ls443766aga.2.gmail; Fri, 27 May 2011\n\
\ 04:29:49 -0700 (PDT)\nMIME-Version: 1.0\nReceived: by 10.90.1.10 with SMTP\
@@ -72,7 +72,7 @@ topics:
\ stejn=EC (hnusn=EC) a bylo to t=EC=BEkop=E1d=\nn=FD.\n>\n> http://blog.sproutcore.com/announcing-sproutcore-2-0/\n\
\n", root: 'https://groups.google.com/forum/message/raw?msg=javascriptcz/-4cy0XTGGaU/Gxus9ddtp5wJ'}
- !!python/object:gg_scrapper.Article {raw_message: "From richte...@gmail.com Thu\
- \ Jan 2 15:15:36 2014\nReceived: by 10.224.9.144 with SMTP id l16mr693260qal.26.1306497361290;\n\
+ \ Jan 2 16:12:07 2014\nReceived: by 10.224.9.144 with SMTP id l16mr693260qal.26.1306497361290;\n\
\ Fri, 27 May 2011 04:56:01 -0700 (PDT)\nX-BeenThere: javascriptcz@googlegroups.com\n\
Received: by 10.224.175.74 with SMTP id w10ls508844qaz.0.gmail; Fri, 27 May\n\
\ 2011 04:56:01 -0700 (PDT)\nMIME-Version: 1.0\nReceived: by 10.224.186.16 with\
@@ -112,7 +112,7 @@ topics:
- !!python/object:gg_scrapper.Topic
articles:
- !!python/object:gg_scrapper.Article {raw_message: "From richte...@gmail.com Thu\
- \ Jan 2 15:15:39 2014\nReceived: by 10.224.126.72 with SMTP id b8mr1923833qas.13.1306351509553;\n\
+ \ Jan 2 16:12:09 2014\nReceived: by 10.224.126.72 with SMTP id b8mr1923833qas.13.1306351509553;\n\
\ Wed, 25 May 2011 12:25:09 -0700 (PDT)\nX-BeenThere: javascriptcz@googlegroups.com\n\
Received: by 10.224.181.131 with SMTP id by3ls169717qab.3.gmail; Wed, 25 May\n\
\ 2011 12:25:08 -0700 (PDT)\nMIME-Version: 1.0\nReceived: by 10.224.203.8 with\
@@ -130,7 +130,7 @@ topics:
- !!python/object:gg_scrapper.Topic
articles:
- !!python/object:gg_scrapper.Article {raw_message: "From richte...@gmail.com Thu\
- \ Jan 2 15:15:40 2014\nReceived: by 10.224.215.3 with SMTP id hc3mr1823425qab.4.1306325120198;\n\
+ \ Jan 2 16:12:10 2014\nReceived: by 10.224.215.3 with SMTP id hc3mr1823425qab.4.1306325120198;\n\
\ Wed, 25 May 2011 05:05:20 -0700 (PDT)\nX-BeenThere: javascriptcz@googlegroups.com\n\
Received: by 10.224.138.148 with SMTP id a20ls76694qau.5.gmail; Wed, 25 May\n\
\ 2011 05:05:20 -0700 (PDT)\nMIME-Version: 1.0\nReceived: by 10.224.217.200\