<?php
/* spoolnews NNTP news spool creator
 * Version: 0.3.0
 * Download: https://news.novabbs.com/getrslight
 *
 * E-Mail: retroguy@novabbs.com
 * Web: https://news.novabbs.com
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */
include "config.inc.php";
// NOTE(review): $file_newsportal is presumably defined by config.inc.php - confirm.
include ("$file_newsportal");

// Per-section state files:
//  - $remote_groupfile: last article number fetched from the remote server, per group
//  - $file_groups:      the configured list of groups
//  - $local_groupfile:  next local article number, per group
$remote_groupfile = $spooldir . "/" . $config_name . "/" . $CONFIG['remote_server'] . ":" . $CONFIG['remote_port'] . ".txt";
$file_groups = $config_path . "groups.txt";
$local_groupfile = $spooldir . "/" . $config_name . "/local_groups.txt";
$logfile = $logdir . '/spoolnews.log';

# END MAIN CONFIGURATION

// Best effort: the directory normally exists already, hence the suppressed warning.
@mkdir($spooldir . "/" . $config_name, 0755, true);

if (!isset($maxarticles_per_run)) {
    $maxarticles_per_run = 100;
}
if (!isset($maxfirstrequest)) {
    $maxfirstrequest = 1000;
}
if (!isset($CONFIG['enable_nntp']) || $CONFIG['enable_nntp'] != true) {
    // Without the local NNTP server the web-side limits are used instead.
    // NOTE(review): $maxarticles / $maxfetch are presumably set by the included
    // configuration; the defaults above are kept when they are missing.
    if (isset($maxarticles)) {
        $maxfirstrequest = $maxarticles;
    }
    if (isset($maxfetch)) {
        $maxarticles_per_run = $maxfetch;
    }
}

$workpath = $spooldir . "/";
$path = $workpath . "articles/";

// Single-instance guard: the lock file holds the pid of the running instance.
// Only treat the lock as held when it contains a pid that is still alive.
$lockfile = sys_get_temp_dir() . '/' . $config_name . '-spoolnews.lock';
$pid = is_file($lockfile) ? trim((string) file_get_contents($lockfile)) : '';
if ($pid !== '' && ctype_digit($pid) && (int) $pid > 0 && posix_getsid((int) $pid) !== false) {
    print "Spoolnews currently running\n";
    exit;
}
print "Starting Spoolnews...\n";
file_put_contents($lockfile, getmypid()); // create lockfile

// Release the lock on every exit path (including exit() calls further down),
// but only if the file still belongs to this process.
register_shutdown_function(function () use ($lockfile) {
    if (is_file($lockfile) && trim((string) file_get_contents($lockfile)) === (string) getmypid()) {
        unlink($lockfile);
    }
});

// A ".reload" semaphore file requests a rebuild of the remote group file.
$sem = $spooldir . "/" . $config_name . ".reload";
if (is_file($sem)) {
    if (is_file($remote_groupfile)) {
        unlink($remote_groupfile);
    }
    unlink($sem);
    $maxfirstrequest = 20;
}

// Threads are refreshed at most once every 600 seconds; a missing timer
// file counts as expired.
$thread_timer_file = $spooldir . '/' . $config_name . '-thread-timer';
if (!is_file($thread_timer_file) || filemtime($thread_timer_file) + 600 < time()) {
    $timer = true;
    touch($thread_timer_file);
} else {
    $timer = false;
}

# Check for groups file, create if necessary
create_spool_groups($file_groups, $remote_groupfile);
create_spool_groups($file_groups, $local_groupfile);

# Iterate through groups
$enable_rslight = 0;

# Refresh group list
$menulist = file($config_dir . "menu.conf", FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
if ($menulist === false) {
    $menulist = [];
}
foreach ($menulist as $menu) {
    if (($menu[0] == '#') || (trim($menu) == "")) {
        continue;
    }
    $menuitem = explode(':', $menu);
    // menu.conf entry "<section>:1..." enables thread handling for this section.
    if (($menuitem[0] == $config_name) && isset($menuitem[1]) && ($menuitem[1] == '1')) {
        groups_read($server, $port, 1);
        $enable_rslight = 1;
        echo "Loaded groups\n";
    }
}

$ns = nntp2_open($CONFIG['remote_server'], $CONFIG['remote_port']);
$ns2 = nntp_open();
if (!$ns) {
    file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Failed to connect to " . $CONFIG['remote_server'] . ":" . $CONFIG['remote_port'], FILE_APPEND);
    exit();
}

$grouplist = file($config_dir . '/' . $config_name . '/groups.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
if ($grouplist === false) {
    $grouplist = [];
}
foreach ($grouplist as $findgroup) {
    // Lines starting with ':' are not group entries.
    if ($findgroup[0] == ":") {
        continue;
    }
    // The group name is everything before the first space or tab.
    $name = preg_split("/( |\t)/", $findgroup, 2);
    file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Retrieving articles for: " . $name[0] . "...", FILE_APPEND);
    echo "\nRetrieving articles for: " . $name[0] . "...\r\n";
    get_articles($ns, $name[0]);

    if ($enable_rslight == 1 && $timer) {
        file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Updating threads for: " . $name[0] . "...", FILE_APPEND);
        thread_load_newsserver($ns2, $name[0], 0);
    }
}
nntp_close($ns2);
nntp_close($ns);
#expire_overview();
if (is_file($lockfile)) {
    unlink($lockfile);
}
echo "\nSpoolnews Done\r\n";

/**
 * Fetch new articles for one newsgroup from the remote server into the spool.
 *
 * For every article number from the saved remote position up to the group's
 * last article this sends STAT (to skip Message-IDs already present in the
 * group's overview file) and ARTICLE, writes the article under
 * $path/<group with dots as slashes>/<local number>, appends a line to the
 * "<group>-overview" file, and inserts a row into the overview database (and,
 * when $CONFIG['article_database'] is '1', into the per-group article
 * database). Afterwards the group title is fetched once via XGTITLE and the
 * remote/local positions are written back to the group files.
 *
 * The run stops after $maxarticles_per_run stored articles, or as soon as the
 * connection drops while an article is being read; progress made so far is
 * saved so the next run resumes at the failed article.
 *
 * @param resource $ns    Open stream to the remote NNTP server.
 * @param string   $group Newsgroup name.
 * @return int|null 1 when the GROUP reply is 411 or cannot be parsed,
 *                  otherwise no value.
 */
function get_articles($ns, $group) {
    global $enable_rslight, $spooldir, $CONFIG, $maxarticles_per_run, $maxfirstrequest, $workpath, $path, $remote_groupfile, $local_groupfile, $local, $logdir, $config_name, $logfile;

    if ($ns == false) {
        file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Lost connection to " . $CONFIG['remote_server'] . ":" . $CONFIG['remote_port'], FILE_APPEND);
        exit();
    }

    $nntp_enabled = isset($CONFIG['enable_nntp']) && $CONFIG['enable_nntp'] == true;
    $use_article_db = isset($CONFIG['article_database']) && $CONFIG['article_database'] == '1';
    $overview_file = $workpath . $group . "-overview";
    $grouppath = $path . preg_replace('/\./', '/', $group);
    $nocem_check = "@@NCM";

    $banned_file = "/etc/rslight/banned_names.conf";
    $banned_names = is_readable($banned_file) ? file($banned_file, FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES) : false;
    if ($banned_names === false) {
        $banned_names = [];
    }

    # Check if group exists. Open it if it does
    fputs($ns, "group " . $group . "\r\n");
    $response = line_read($ns);
    if (strcmp(substr($response, 0, 3), "411") == 0) {
        echo "\n" . $response . "\n";
        return (1);
    }
    # Split group response line to get first/last article number
    # (fields 2 and 3 of the reply).
    $detail = explode(" ", $response);
    if (count($detail) < 4 || !is_numeric($detail[2]) || !is_numeric($detail[3])) {
        file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Unexpected response to GROUP command: " . $response, FILE_APPEND);
        return (1);
    }
    $first = (int) $detail[2];
    $last = (int) $detail[3];

    # Get config: resume one past the article number saved for this group
    $grouplist = file($remote_groupfile, FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
    if ($grouplist === false) {
        $grouplist = [];
    }
    foreach ($grouplist as $findgroup) {
        $name = explode(':', trim($findgroup));
        if (strcmp($name[0], $group) == 0) {
            if (isset($name[1]) && is_numeric($name[1])) {
                $article = $name[1] + 1;
            }
            break;
        }
    }

    if ($nntp_enabled) {
        // Try to find last article number in local_groupfile, falling back to
        // the highest number recorded in the overview file.
        $local = get_high_watermark($group);
        if (!is_numeric($local)) {
            $ok_article = get_article_list($group);
            sort($ok_article);
            $local = empty($ok_article) ? 0 : end($ok_article);
            if (!is_numeric($local)) {
                $local = 0;
            }
            $local = $local + 1;
        }
        if ($local < 1) {
            $local = 1;
        }
    }

    // Clamp the starting article into the range the server still offers,
    // going back at most $maxfirstrequest articles.
    if (!isset($article)) {
        $article = $first;
    }
    if ($article < $last - $maxfirstrequest) {
        $article = $last - $maxfirstrequest;
    }
    if ($article < $first) {
        $article = $first;
    }
    // Broken message on last run? Let's try again.
    if ($article > ($last + 1)) {
        $article = $last;
    }

    # Prepare databases
    $database = $spooldir . '/articles-overview.db3';
    $table = 'overview';
    $dbh = rslight_db_open($database, $table);
    $sql = 'INSERT INTO ' . $table . '(newsgroup, number, msgid, date, name, subject) VALUES(?,?,?,?,?,?)';
    $stmt = $dbh->prepare($sql);
    if ($use_article_db) {
        $article_dbh = article_db_open($spooldir . '/' . $group . '-articles.db3');
        $article_sql = 'INSERT INTO articles(newsgroup, number, msgid, date, name, subject, article, search_snippet) VALUES(?,?,?,?,?,?,?,?)';
        $article_stmt = $article_dbh->prepare($article_sql);
    }

    # Pull articles and save them in our spool
    @mkdir($grouppath, 0755, true);
    $i = 0;
    $connection_lost = false;
    while ($article <= $last) {
        if (!is_numeric($article)) {
            file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " DEBUG This should show server group:article number: " . $CONFIG['remote_server'] . " " . $group . ":" . $article, FILE_APPEND);
            break;
        }
        if (!$nntp_enabled) {
            // Without the local NNTP server, local numbers mirror the remote ones.
            $local = $article;
        }

        // Check for duplicate msgid. Only a 223 reply carries a Message-ID in
        // its third field; other replies fall through to ARTICLE, which logs
        // the failure.
        $duplicate = 0;
        fputs($ns, "stat " . $article . "\r\n");
        $response = line_read($ns);
        $this_msgid = explode(' ', $response);
        if (strcmp(substr($response, 0, 3), "223") == 0 && isset($this_msgid[2]) && $this_msgid[2] !== '' && is_readable($overview_file)) {
            $group_overviewfp = fopen($overview_file, 'r');
            if ($group_overviewfp !== false) {
                while (($group_overview = fgets($group_overviewfp, 2048)) !== false) {
                    $overview_msgid = explode("\t", $group_overview);
                    if (isset($overview_msgid[4]) && strpos($overview_msgid[4], $this_msgid[2]) !== false) {
                        $duplicate = 1;
                        break;
                    }
                }
                fclose($group_overviewfp);
            }
        }
        if ($duplicate == 1) {
            echo "\nDuplicate Message-ID for: " . $CONFIG['remote_server'] . " " . $group . ":" . $article . "\n";
            file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Duplicate Message-ID for: " . $CONFIG['remote_server'] . " " . $group . ":" . $article, FILE_APPEND);
            $article++;
            continue;
        }

        fputs($ns, "article " . $article . "\r\n");
        $response = line_read($ns);
        if (strcmp(substr($response, 0, 3), "220") != 0) {
            echo "\n" . $response . "\n";
            file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Unexpected response to ARTICLE command: " . $response, FILE_APPEND);
            $article++;
            continue;
        }
        if ($nntp_enabled) {
            // Never overwrite an article already present in the spool.
            while (is_file($grouppath . "/" . $local)) {
                $local++;
            }
        }
        $article_file = $grouppath . "/" . $local;
        $articleHandle = fopen($article_file, 'w+');
        if ($articleHandle === false) {
            // The reply to ARTICLE is still unread, so the connection cannot
            // be reused; an unwritable spool is fatal for the whole run.
            file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Cannot write to spool: " . $article_file, FILE_APPEND);
            exit();
        }

        // Per-article state. Header values are reset so that an article
        // missing a header does not inherit it from the previous article.
        $lines = 0;
        $bytes = 0;
        $ref = 0;          // 1 while the References header may still be continued
        $banned = 0;
        $is_header = 1;
        $body = "";
        $subject_text = "";
        $from_text = "";
        $date_text = "";
        $msgid = "";
        $references = "";
        $xref = "";
        $charset = null;
        $article_date = time();

        $response = line_read($ns);
        while (strcmp($response, ".") != 0) {
            $bytes = $bytes + mb_strlen($response, '8bit');
            // The first blank line ends the header; every line from there on
            // (including the blank one) is counted.
            if (trim($response) == "" || $lines > 0) {
                $is_header = 0;
                $lines++;
            }
            if ($is_header == 1) {
                $response = str_replace("\t", " ", $response);
                // Find article date
                if (stripos($response, "Date: ") === 0) {
                    $date_text = explode(': ', $response, 2)[1];
                    $parsed_date = strtotime($date_text);
                    if ($parsed_date !== false) {
                        $article_date = $parsed_date;
                    }
                }
                // Get overview data
                if (stripos($response, "Message-ID: ") === 0) {
                    $msgid = explode(': ', $response, 2)[1];
                    $ref = 0;
                }
                if (stripos($response, "From: ") === 0) {
                    $from_text = explode(': ', $response, 2)[1];
                    if ($nntp_enabled) {
                        foreach ($banned_names as $banned_name) {
                            if (trim($banned_name) !== '' && stripos($from_text, $banned_name) !== false) {
                                $banned = 1;
                            }
                        }
                    }
                    $ref = 0;
                }
                if (stripos($response, "Subject: ") === 0) {
                    // substr() rather than explode('Subject: ') so that the
                    // case-insensitive match above also yields a value.
                    $subject_text = substr($response, strlen("Subject: "));
                    $ref = 0;
                }
                if (stripos($response, "Newsgroups: ") === 0) {
                    // Normalises the letter case of this group's name in the header.
                    $response = str_ireplace($group, $group, $response);
                    $ref = 0;
                }
                if (stripos($response, "Xref: ") === 0) {
                    if ($nntp_enabled) {
                        $response = "Xref: " . $CONFIG['pathhost'] . " " . $group . ":" . $local;
                    }
                    $xref = $response;
                    $ref = 0;
                }
                if (stripos($response, "Content-Type: ") === 0) {
                    if (preg_match('/.*charset=.*/', $response, $te)) {
                        $content_type = explode("Content-Type: text/plain; charset=", $te[0]);
                        if (isset($content_type[1])) {
                            $charset = $content_type[1];
                        }
                    }
                }
                if (stripos($response, "References: ") === 0) {
                    $references = substr($response, strlen("References: "));
                    $ref = 1;
                }
                // A header line without ':' but containing '>' directly after
                // References is treated as its continuation.
                if ((stripos($response, ':') === false) && (strpos($response, '>') !== false)) {
                    if ($ref == 1) {
                        $references = $references . $response;
                    }
                }
            } else {
                $body .= $response . "\n";
            }
            fputs($articleHandle, $response . "\n");
            // Check here for broken $ns connection before continuing
            $response = fgets($ns, 1200);
            if ($response === false) {
                $connection_lost = true;
                break;
            }
            $response = str_replace(array("\r", "\n"), "", $response);
        }
        if ($connection_lost) {
            // Drop the partial article and stop; the article is retried on the
            // next run because the saved position ends up one before it.
            file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Lost connection to " . $CONFIG['remote_server'] . ":" . $CONFIG['remote_port'] . " retrieving article " . $article, FILE_APPEND);
            fclose($articleHandle);
            unlink($article_file);
            break;
        }
        // The terminating "." line is stored with the article.
        fputs($articleHandle, $response . "\n");
        fclose($articleHandle);
        $lines = $lines - 1;
        $bytes = $bytes + ($lines * 2);

        // Don't spool article if $banned=1
        if ($banned == 1) {
            unlink($article_file);
            file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Skipping: " . $CONFIG['remote_server'] . " " . $group . ":" . $article . " user: " . $from_text . " is banned", FILE_APPEND);
            $article++;
            continue;
        }

        // Keep a copy of NoCeM notices for later processing.
        if (isset($CONFIG['nocem_groups']) && (strpos($CONFIG['nocem_groups'], $group) !== false) && isset($CONFIG['enable_nocem']) && ($CONFIG['enable_nocem'] == true)) {
            if (strpos($subject_text, $nocem_check) !== false) {
                $nocem_file = tempnam($spooldir . "/nocem", "nocem-" . $group . "-");
                copy($article_file, $nocem_file);
            }
        }

        // Overview
        $overviewHandle = fopen($overview_file, 'a');
        fputs($overviewHandle, $local . "\t" . $subject_text . "\t" . $from_text . "\t" . $date_text . "\t" . $msgid . "\t" . $references . "\t" . $bytes . "\t" . $lines . "\t" . $xref . "\n");
        fclose($overviewHandle);

        // add to database
        $stmt->execute([$group, $local, $msgid, $article_date, $from_text, $subject_text]);
        if ($use_article_db) {
            $this_article = file_get_contents($article_file);
            // CREATE SEARCH SNIPPET
            $this_snippet = get_search_snippet($body, $charset);
            $article_stmt->execute([$group, $local, $msgid, $article_date, $from_text, $subject_text, $this_article, $this_snippet]);
            // The article now lives in the database only.
            unlink($article_file);
        } else {
            // Stamp the spool file with the article date, never in the future.
            if ($article_date > time()) {
                $article_date = time();
            }
            touch($article_file, $article_date);
        }

        echo "\nRetrieved: " . $group . " " . $article . "\n";
        file_put_contents($logfile, "\n" . format_log_date() . " " . $config_name . " Wrote to spool: " . $CONFIG['remote_server'] . " " . $group . ":" . $article, FILE_APPEND);
        $i++;
        $article++;
        $local++;
        if ($i >= $maxarticles_per_run) {
            break;
        }
    }
    // $article now points one past the last handled article; store the last
    // handled one, because the next run starts at the saved value + 1.
    $article--;

    // Update title (skipped when the connection is already gone)
    if (!$connection_lost && !is_file($workpath . $group . "-title")) {
        fputs($ns, "XGTITLE " . $group . "\r\n");
        $response = line_read($ns);
        if (strcmp(substr($response, 0, 3), "282") == 0) {
            $overviewHandle = fopen($workpath . $group . "-title", 'w');
            $response = line_read($ns);
            // NOTE(review): line_read() is defined elsewhere; the extra
            // false/feof checks assume it cannot return "." once the stream
            // has ended - confirm.
            while ($response !== false && strcmp($response, ".") != 0 && !feof($ns)) {
                fputs($overviewHandle, $response . "\r\n");
                $response = line_read($ns);
            }
            fclose($overviewHandle);
        }
    }

    # Save config: rewrite this group's entry in the remote and local group
    # files, leaving all other lines as they are.
    foreach ([[$remote_groupfile, $article], [$local_groupfile, $local]] as $target) {
        $grouplist = file($target[0], FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
        if ($grouplist === false) {
            // Do not truncate a file that could not be read.
            continue;
        }
        $contents = "";
        foreach ($grouplist as $savegroup) {
            $name = explode(':', $savegroup);
            if (strcmp($name[0], $group) == 0) {
                $contents .= $group . ":" . $target[1] . "\n";
            } else {
                $contents .= $savegroup . "\n";
            }
        }
        file_put_contents($target[0], $contents);
    }

    // Release the database handles.
    if ($use_article_db) {
        $article_dbh = null;
    }
    $dbh = null;
}
/**
 * Make sure every group listed in $in_groups has an entry in $out_groups.
 *
 * Lines of $in_groups that start with ':' are skipped; for all others the
 * group name is the text before the first space or tab. A group counts as
 * present when a line of $out_groups has exactly that name (compared
 * case-insensitively) before its first ':'; a plain substring test would
 * treat "comp.lang.c" as present whenever "comp.lang.c++" is listed.
 * Missing groups are appended as "<name>\r\n". $out_groups is created when
 * it does not exist yet.
 *
 * @param string $in_groups  Path of the configured groups list.
 * @param string $out_groups Path of the spool group file to extend.
 * @return void
 */
function create_spool_groups($in_groups, $out_groups) {
    // Collect the names already present once instead of rescanning the
    // output file for every configured group.
    $known = [];
    if (is_file($out_groups)) {
        $existing = file($out_groups, FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
        if ($existing !== false) {
            foreach ($existing as $line) {
                $fields = explode(':', trim($line), 2);
                $known[strtolower($fields[0])] = true;
            }
        }
    }

    // Opened before reading the input so the file gets created in any case.
    $groupout = fopen($out_groups, "a");
    if ($groupout === false) {
        return;
    }

    $grouplist = is_readable($in_groups) ? file($in_groups, FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES) : false;
    if ($grouplist === false) {
        $grouplist = [];
    }
    foreach ($grouplist as $group) {
        if ($group[0] == ":") {
            continue;
        }
        $thisgroup = preg_split("/( |\t)/", $group, 2);
        $key = strtolower($thisgroup[0]);
        if ($key === '' || isset($known[$key])) {
            continue;
        }
        fwrite($groupout, $thisgroup[0] . "\r\n");
        // Remember it so a group listed twice is only written once.
        $known[$key] = true;
    }
    fclose($groupout);
    return;
}
/**
 * Look up the number stored for $group in the local group file.
 *
 * Reads the file named by the global $local_groupfile and returns the second
 * ':'-separated field (trimmed) of the first line that starts with
 * "<group>:". The match is anchored at the start of the line so that a group
 * whose name is the tail of another one (e.g. "comp.lang.c" and
 * "alt.comp.lang.c") does not pick up the other group's value.
 *
 * @param string $group Newsgroup name.
 * @return string|false The stored value, or FALSE when the file cannot be
 *                      read or has no "<group>:" line.
 */
function get_high_watermark($group) {
    global $local_groupfile;

    if (!is_string($local_groupfile) || !is_readable($local_groupfile)) {
        return FALSE;
    }
    $configFileHandle = fopen($local_groupfile, 'r');
    if ($configFileHandle === false) {
        return FALSE;
    }

    $prefix = $group . ':';
    $prefix_length = strlen($prefix);
    while (($buffer = fgets($configFileHandle)) !== false) {
        if (strncmp($buffer, $prefix, $prefix_length) === 0) {
            fclose($configFileHandle);
            $datafound = explode(':', $buffer);
            return trim($datafound[1]);
        }
    }
    fclose($configFileHandle);
    return FALSE;
}
/**
 * List the article numbers recorded in a group's overview file.
 *
 * Reads "<spooldir>/<group>-overview" line by line and collects the first
 * tab-separated field of every line where that field is numeric, in file
 * order.
 *
 * @param string $thisgroup Newsgroup name.
 * @return array List of article numbers as strings; empty when the overview
 *               file does not exist or cannot be read (e.g. a group that has
 *               never been spooled).
 */
function get_article_list($thisgroup) {
    global $spooldir;

    $ok_article = array();
    $overview_file = $spooldir . "/" . $thisgroup . "-overview";
    if (!is_readable($overview_file)) {
        return ($ok_article);
    }
    $group_overviewfp = fopen($overview_file, 'r');
    if ($group_overviewfp === false) {
        return ($ok_article);
    }
    // Compare against false explicitly: a final line consisting of "0"
    // would otherwise end the loop early.
    while (($line = fgets($group_overviewfp)) !== false) {
        $art = explode("\t", $line);
        if (is_numeric($art[0])) {
            $ok_article[] = $art[0];
        }
    }
    fclose($group_overviewfp);
    return ($ok_article);
}
?>