From ce4f20c9a683d552486826058ab6d2b13baebf09 Mon Sep 17 00:00:00 2001 From: Samathy Barratt Date: Fri, 16 Apr 2021 15:46:13 +0100 Subject: [PATCH 1/2] Use pthreads to download podcasts in parallel. Spin up as many threads as there are podcasts to download - which is potentially a LOT of threads. Also, progress bars don't work. --- configure.ac | 4 ++ src/Makefile.am | 6 ++- src/channel.c | 129 +++++++++++++++++++++++++++++++++++++++--------- src/channel.h | 23 +++++++++ 4 files changed, 136 insertions(+), 26 deletions(-) diff --git a/configure.ac b/configure.ac index 17f6c8e..5afd53c 100644 --- a/configure.ac +++ b/configure.ac @@ -46,6 +46,10 @@ else AC_SUBST(CURL_LIBS) fi +PTHREAD_LIBS=-lpthread +AC_SUBST(PTHREAD_CFLAGS) +AC_SUBST(PTHREAD_LIBS) + #AC_ARG_WITH(taglib, [ --without-taglib disable taglib support]) AC_ARG_WITH(taglib, AC_HELP_STRING([--without-taglib], [disable taglib support])]) if test "x$with_taglib" != "xno"; then diff --git a/src/Makefile.am b/src/Makefile.am index 1a47806..4e45ce9 100644 --- a/src/Makefile.am +++ b/src/Makefile.am @@ -15,7 +15,7 @@ # License along with this library; if not, write to the Free Software # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA # -AM_CPPFLAGS = $(GLIBS_CFLAGS) $(CURL_CFLAGS) +AM_CPPFLAGS = $(GLIBS_CFLAGS) $(CURL_CFLAGS) $(PTHREAD_CFLAGS) bin_PROGRAMS = castget @@ -47,4 +47,6 @@ castget_SOURCES = \ castget_LDADD = \ $(CURL_LIBS) \ $(GLIBS_LIBS) \ - $(TAGLIB_LIBS) + $(TAGLIB_LIBS) \ + $(PTHREAD_LIBS) \ + diff --git a/src/channel.c b/src/channel.c index 09b9335..4336232 100644 --- a/src/channel.c +++ b/src/channel.c @@ -29,7 +29,10 @@ #include "urlget.h" #include "utils.h" +#include #include +#include +#include #include #include #include @@ -278,6 +281,16 @@ static int _do_download(channel *c, channel_info *channel_info, rss_item *item, return download_failed; } +void *_do_download_thread(void *arg) +{ + download_data *data = (download_data *)arg; + // Resume and progress bars are disabled, because + // those will be tricky with threading. + data->result = _do_download(data->c, data->channel_info, data->item, + data->user_data, data->cb, 0, data->debug, 0); + pthread_exit(NULL); +} + static int _do_catchup(channel *c, channel_info *channel_info, rss_item *item, void *user_data, channel_callback cb) { @@ -292,6 +305,14 @@ static int _do_catchup(channel *c, channel_info *channel_info, rss_item *item, return 0; } +void *_do_catchup_thread(void *arg) +{ + catchup_data *data = (catchup_data *)arg; + data->result = _do_catchup(data->c, data->channel_info, data->item, + data->user_data, data->cb); + pthread_exit(NULL); +} + int channel_update(channel *c, void *user_data, channel_callback cb, int no_download, int no_mark_read, int first_only, int resume, enclosure_filter *filter, int debug, @@ -299,10 +320,17 @@ int channel_update(channel *c, void *user_data, channel_callback cb, { int i, download_failed; rss_file *f; + int num_catchup = 0; + int num_download = 0; + void *status; + int t_result; /* Retrieve the RSS file. */ f = _get_rss(c, user_data, cb, debug); + catchup_data catchup_items[f->num_items]; + download_data download_items[f->num_items]; + if (!f) return 1; @@ -317,35 +345,88 @@ int channel_update(channel *c, void *user_data, channel_callback cb, item = f->items[i]; if (!filter || _enclosure_pattern_match(filter, item->enclosure)) { - if (no_download) - download_failed = - _do_catchup(c, &(f->channel_info), item, user_data, cb); - else - download_failed = - _do_download(c, &(f->channel_info), item, user_data, cb, resume, - debug, show_progress_bar); - - if (download_failed) - break; - - if (!no_mark_read) { - /* Mark enclosure as downloaded and immediately save channel - file to ensure that it reflects the change. */ - g_hash_table_insert(c->downloaded_enclosures, - f->items[i]->enclosure->url, - (gpointer)get_rfc822_time()); - - _cast_channel_save(c, debug); + if (no_download) { + // download_failed = + //_do_catchup(c, &(f->channel_info), item, user_data, cb); + catchup_items[num_catchup] = + (catchup_data){ .c = c, + .channel_info = &(f->channel_info), + .item = item, + .user_data = user_data, + .cb = cb }; + num_catchup++; + } else { + // download_failed = + //_do_download(c, &(f->channel_info), item, user_data, cb, resume, + // debug, show_progress_bar); + download_items[num_download] = + (download_data){ .c = c, + .channel_info = &(f->channel_info), + .item = item, + .user_data = user_data, + .cb = cb, + .resume = resume, + .debug = debug, + .show_progress_bar = show_progress_bar }; + num_download++; } - - /* If we have been instructed to deal only with the first - available enclosure, it is time to break out of the loop. */ - if (first_only) - break; } + + /* If we have been instructed to deal only with the first + available enclosure, it is time to break out of the loop. */ + if (first_only) + break; } } + pthread_t catchup_threads[num_catchup]; + + for (i = 0; i < num_catchup; i++) { + pthread_create(&catchup_threads[i], NULL, _do_catchup_thread, + (void *)&catchup_items[i]); + } + + pthread_t download_threads[num_download]; + for (i = 0; i < num_download; i++) { + pthread_create(&download_threads[i], NULL, _do_download_thread, + (void *)&download_items[i]); + } + + for (i = 0; i < num_catchup; i++) { + t_result = pthread_join(catchup_threads[i], NULL); + if (t_result != 0) + printf(strerror(t_result)); + if (catchup_items[i].result != 0) { + download_failed = 1; + break; + } + if (!no_mark_read) { + /* Mark enclosure as downloaded and immediately save channel + file to ensure that it reflects the change. */ + g_hash_table_insert(c->downloaded_enclosures, f->items[i]->enclosure->url, + (gpointer)get_rfc822_time()); + + _cast_channel_save(c, debug); + } + } + + for (i = 0; i < num_download; i++) { + t_result = pthread_join(download_threads[i], NULL); + if (t_result != 0) + printf(strerror(t_result)); + if (download_items[i].result != 0 || download_failed) { + download_failed = 1; + printf("Download failed"); + break; + } + /* Mark enclosure as downloaded and immediately save channel + file to ensure that it reflects the change. */ + g_hash_table_insert(c->downloaded_enclosures, f->items[i]->enclosure->url, + (gpointer)get_rfc822_time()); + + _cast_channel_save(c, debug); + } + if (!no_mark_read) { /* Update the RSS last fetched time and save the channel file again. */ diff --git a/src/channel.h b/src/channel.h index 786577a..919315e 100644 --- a/src/channel.h +++ b/src/channel.h @@ -72,4 +72,27 @@ int channel_update(channel *c, void *user_data, channel_callback cb, enclosure_filter *enclosure_filter_new(const gchar *pattern, gboolean caseless); void enclosure_filter_free(enclosure_filter *e); +typedef struct _rss_item rss_item; + +typedef struct _download_data { + channel *c; + channel_info *channel_info; + rss_item *item; + void *user_data; + channel_callback cb; + int resume; + int debug; + int show_progress_bar; + int result; +} download_data; + +typedef struct _catchup_data { + channel *c; + channel_info *channel_info; + rss_item *item; + void *user_data; + channel_callback cb; + int result; +} catchup_data; + #endif /* CHANNEL_H */ From f78ee4eefc46a6689ac8cb262419300686d14ef4 Mon Sep 17 00:00:00 2001 From: Samathy Barratt Date: Fri, 16 Apr 2021 15:56:22 +0100 Subject: [PATCH 2/2] Can't have progress bars, so just print the title --- src/channel.c | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/channel.c b/src/channel.c index 4336232..2427b39 100644 --- a/src/channel.c +++ b/src/channel.c @@ -286,8 +286,12 @@ void *_do_download_thread(void *arg) download_data *data = (download_data *)arg; // Resume and progress bars are disabled, because // those will be tricky with threading. + if (data->show_progress_bar) + printf("Downloading: %s\n", data->item->title); data->result = _do_download(data->c, data->channel_info, data->item, data->user_data, data->cb, 0, data->debug, 0); + if (data->show_progress_bar) + printf("Download Complete: %s\n", data->item->title); pthread_exit(NULL); }