Compare commits

...

11 Commits

Author SHA1 Message Date
cbe027d5e9 Remove IDE files from repository (.idea) 2026-01-01 14:02:22 +01:00
8fee3d27a7 reporter 2026-01-01 13:58:17 +01:00
178f93624e z230 2025-12-31 07:00:27 +01:00
d91e30c3ef Merge remote-tracking branch 'origin/main' 2025-12-31 06:54:21 +01:00
0052b5f125 z230 2025-12-31 06:53:59 +01:00
a3dbc934ed reporter 2025-12-30 18:40:37 +01:00
0f88f0c7d0 Merge remote-tracking branch 'origin/main'
# Conflicts:
#	90 test.py
2025-12-29 23:28:05 +01:00
4678d3fe7f reporter 2025-12-29 06:32:04 +01:00
b39e94a054 Merge remote-tracking branch 'origin/main' 2025-12-29 06:31:31 +01:00
e99d42fa97 Add .gitignore (PyCharm, Python cache) 2025-12-29 05:48:36 +01:00
fdba388228 reporter 2025-12-28 07:19:48 +01:00
887 changed files with 1636851 additions and 53 deletions

3
.idea/.gitignore generated vendored
View File

@@ -1,3 +0,0 @@
# Default ignored files
/shelf/
/workspace.xml

10
.idea/NewsGroups.iml generated
View File

@@ -1,10 +0,0 @@
<?xml version="1.0" encoding="UTF-8"?>
<module type="PYTHON_MODULE" version="4">
<component name="NewModuleRootManager">
<content url="file://$MODULE_DIR$">
<excludeFolder url="file://$MODULE_DIR$/.venv" />
</content>
<orderEntry type="jdk" jdkName="Python 3.12 (NewsGroups)" jdkType="Python SDK" />
<orderEntry type="sourceFolder" forTests="false" />
</component>
</module>

View File

@@ -1,16 +0,0 @@
<component name="InspectionProjectProfileManager">
<profile version="1.0">
<option name="myName" value="Project Default" />
<inspection_tool class="PyCompatibilityInspection" enabled="true" level="WARNING" enabled_by_default="true">
<option name="ourVersions">
<value>
<list size="3">
<item index="0" class="java.lang.String" itemvalue="2.7" />
<item index="1" class="java.lang.String" itemvalue="3.13" />
<item index="2" class="java.lang.String" itemvalue="3.7" />
</list>
</value>
</option>
</inspection_tool>
</profile>
</component>

View File

@@ -1,6 +0,0 @@
<component name="InspectionProjectProfileManager">
<settings>
<option name="USE_PROJECT_PROFILE" value="false" />
<version value="1.0" />
</settings>
</component>

8
.idea/modules.xml generated
View File

@@ -1,8 +0,0 @@
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="ProjectModuleManager">
<modules>
<module fileurl="file://$PROJECT_DIR$/.idea/NewsGroups.iml" filepath="$PROJECT_DIR$/.idea/NewsGroups.iml" />
</modules>
</component>
</project>

6
.idea/vcs.xml generated
View File

@@ -1,6 +0,0 @@
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="VcsDirectoryMappings">
<mapping directory="$PROJECT_DIR$" vcs="Git" />
</component>
</project>

View File

@@ -15,8 +15,9 @@ def sanitize(value):
# ================= CONFIG ================= # ================= CONFIG =================
GROUP = "alt.binaries.e-book.magazines" GROUP = "alt.binaries.e-book.magazines"
TOTAL_ARTICLES = 50_000_000 TOTAL_ARTICLES = 75_000_000
BATCH_SIZE = 10_000 BATCH_SIZE = 50_000
FIRST=70805000
# ========================================= # =========================================
load_dotenv() load_dotenv()
@@ -43,8 +44,10 @@ with nntplib.NNTP_SSL(
first = int(first) first = int(first)
last = int(last) last = int(last)
start_global = first # start_global = first
end_global = min(first + TOTAL_ARTICLES - 1, last) start_global = FIRST
# end_global = min(first + TOTAL_ARTICLES - 1, last)
end_global = last
print(f"🎯 Target range: {start_global} {end_global}") print(f"🎯 Target range: {start_global} {end_global}")

Binary file not shown.

File diff suppressed because one or more lines are too long

Binary file not shown.

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1,3 @@
=ybegin part=1 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=1 end=384000
=yend size=384000 part=1 pcrc32=4d91c8dd

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=2 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=384001 end=768000
=yend size=384000 part=2 pcrc32=74a7751c

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=3 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=768001 end=1152000
=yend size=384000 part=3 pcrc32=51841fc7

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=4 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=1152001 end=1536000
=yend size=384000 part=4 pcrc32=93f6f0ed

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=5 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=1536001 end=1920000
=yend size=384000 part=5 pcrc32=5a352a85

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=6 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=1920001 end=2304000
=yend size=384000 part=6 pcrc32=5076b1b1

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=7 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=2304001 end=2688000
=yend size=384000 part=7 pcrc32=94492d58

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=8 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=2688001 end=3072000
=yend size=384000 part=8 pcrc32=b6a971c4

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=9 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=3072001 end=3456000
=yend size=384000 part=9 pcrc32=a128c523

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=10 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=3456001 end=3840000
=yend size=384000 part=10 pcrc32=37cf6bcc

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=11 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=3840001 end=4224000
=yend size=384000 part=11 pcrc32=c60f1222

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=12 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=4224001 end=4608000
=yend size=384000 part=12 pcrc32=3b74ecd5

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=13 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=4608001 end=4992000
=yend size=384000 part=13 pcrc32=115414c5

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=14 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=4992001 end=5376000
=yend size=384000 part=14 pcrc32=07b59e1a

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=15 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=5376001 end=5760000
=yend size=384000 part=15 pcrc32=94b7ef5b

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=16 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=5760001 end=6144000
=yend size=384000 part=16 pcrc32=5895dce4

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=17 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=6144001 end=6528000
=yend size=384000 part=17 pcrc32=13de48c8

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=18 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=6528001 end=6912000
=yend size=384000 part=18 pcrc32=967b2ba1

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=19 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=6912001 end=7296000
=yend size=384000 part=19 pcrc32=a8411113

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=20 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=7296001 end=7680000
=yend size=384000 part=20 pcrc32=1159d67b

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=21 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=7680001 end=8064000
=yend size=384000 part=21 pcrc32=424cc4a6

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=22 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=8064001 end=8448000
=yend size=384000 part=22 pcrc32=4f48d686

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=23 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=8448001 end=8832000
=yend size=384000 part=23 pcrc32=f4d9baaa

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=24 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=8832001 end=9216000
=yend size=384000 part=24 pcrc32=40138344

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=25 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=9216001 end=9600000
=yend size=384000 part=25 pcrc32=310a07cc

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=26 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=9600001 end=9984000
=yend size=384000 part=26 pcrc32=c419b2c6

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=27 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=9984001 end=10368000
=yend size=384000 part=27 pcrc32=ef0d0cc7

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=28 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=10368001 end=10752000
=yend size=384000 part=28 pcrc32=dac071ff

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=29 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=10752001 end=11136000
=yend size=384000 part=29 pcrc32=69634242

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=30 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=11136001 end=11520000
=yend size=384000 part=30 pcrc32=5baebd23

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=31 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=11520001 end=11904000
=yend size=384000 part=31 pcrc32=262b4192

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=32 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=11904001 end=12288000
=yend size=384000 part=32 pcrc32=2640bb94

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=33 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=12288001 end=12672000
=yend size=384000 part=33 pcrc32=f76ce29a

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=34 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=12672001 end=13056000
=yend size=384000 part=34 pcrc32=eabd43a7

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=35 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=13056001 end=13440000
=yend size=384000 part=35 pcrc32=a31c9a31

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=36 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=13440001 end=13824000
=yend size=384000 part=36 pcrc32=5b51957b

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=37 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=13824001 end=14208000
=yend size=384000 part=37 pcrc32=653597ab

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=38 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=14208001 end=14592000
=yend size=384000 part=38 pcrc32=9d228c0a

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=39 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=14592001 end=14976000
=yend size=384000 part=39 pcrc32=f1ac1bea

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=40 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=14976001 end=15360000
=yend size=384000 part=40 pcrc32=8a0a21b4

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=41 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=15360001 end=15744000
=yend size=384000 part=41 pcrc32=a80e0a0a

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=42 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=15744001 end=16128000
=yend size=384000 part=42 pcrc32=7cb1a379

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=43 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=16128001 end=16512000
=yend size=384000 part=43 pcrc32=9bbb4981

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=44 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=16512001 end=16896000
=yend size=384000 part=44 pcrc32=3a61e84f

Binary file not shown.

View File

@@ -0,0 +1,3 @@
=ybegin part=45 line=128 size=118119081 name=PC Pro 2011-07.pdf
=ypart begin=16896001 end=17280000
=yend size=384000 part=45 pcrc32=2b19371c

Some files were not shown because too many files have changed in this diff Show More