[Enhancement]: Add audioteka.com.pl as metadata provider #2073

New Issue

2026-04-25T00:03:10+02:00

adam commented

2026-04-25 00:03:10 +02:00

Originally created by @izikeros on GitHub (Jun 27, 2024).

Type of Enhancement

Server Backend

Describe the Feature/Enhancement

There is a service (Audioteka) that provides a wide collection of audiobooks and has metadata for them. Audiobookshelf already has providers for metadata and covers; this would be another possible source of metadata.

Why would this be helpful?

It would complement the existing sources, since it can provide metadata in Polish. Use case: a user has a collection of Polish audiobooks (e.g. the titles are in Polish) and would like to enrich the library with metadata.

Future Implementation (Screenshot)

I gave some context info to an AI and it generated code that has some chance of working. I'm not a JavaScript programmer and can't run/debug it. This might be a starting point.

const axios = require('axios').default
const cheerio = require('cheerio')
const Logger = require('../Logger')

/**
 * Metadata provider that scrapes audioteka.com (Polish catalogue).
 *
 * `search()` loads the search results page, collects the product links and
 * scrapes each product page for its JSON-LD metadata.
 */
class AudiotekaProvider {
  #responseTimeout = 30000
  #baseUrl = 'https://audioteka.com'

  constructor() {}

  /**
   * Search for an audiobook on audioteka.com.pl
   *
   * Only `title` is used to build the query; the remaining positional
   * parameters are accepted for signature compatibility and are ignored.
   *
   * @param {string} title
   * @param {string} author
   * @param {string} isbn
   * @param {string} providerSlug
   * @param {string} mediaType
   * @param {number} [timeout] response timeout in ms
   * @returns {Promise<Object[]>} successfully scraped results; empty on error or no matches
   */
  async search(title, author, isbn, providerSlug, mediaType, timeout = this.#responseTimeout) {
    if (!timeout || Number.isNaN(Number(timeout))) timeout = this.#responseTimeout
    // Nothing to search for; avoid querying for the literal string "undefined"
    if (!title) return []

    const encodedTitle = encodeURIComponent(title)
    const url = `${this.#baseUrl}/pl/search?query=${encodedTitle}`

    try {
      const response = await axios.get(url, { timeout })
      const $ = cheerio.load(response.data)

      // A Set drops duplicate links so the same product page is not fetched twice
      const productUrls = new Set()
      $('.product-tile').each((index, element) => {
        const productUrl = this.#resolveUrl($(element).find('a').attr('href'))
        if (productUrl) productUrls.add(productUrl)
      })

      const results = await Promise.all([...productUrls].map((productUrl) => this.scrapeAudiobookDetails(productUrl, timeout)))
      // scrapeAudiobookDetails resolves to null on failure; do not hand those to callers
      return results.filter(Boolean)
    } catch (error) {
      Logger.error('[AudiotekaProvider] Search error', error)
      return []
    }
  }

  /**
   * Scrape audiobook details from a specific URL
   *
   * @param {string} url absolute URL of the product page
   * @param {number} [timeout] response timeout in ms
   * @returns {Promise<Object|null>} metadata object, or null when the page could not be fetched or parsed
   */
  async scrapeAudiobookDetails(url, timeout = this.#responseTimeout) {
    try {
      const response = await axios.get(url, { timeout })
      const $ = cheerio.load(response.data)

      const jsonLd = this.#extractJsonLd($)
      if (!jsonLd) {
        Logger.error('[AudiotekaProvider] No JSON-LD metadata found', url)
        return null
      }

      return {
        title: jsonLd.name,
        subtitle: null,
        author: this.#toNames(jsonLd.author).join(', '),
        narrator: this.#toNames(jsonLd.readBy).join(', ') || null,
        publisher: this.#toNames(jsonLd.publisher).join(', ') || null,
        publishedYear: this.#toYear(jsonLd.datePublished),
        description: $('article p').text().trim(),
        cover: this.#toImageUrl(jsonLd.image),
        isbn: null,
        asin: null,
        genres: null,
        tags: null,
        series: null,
        language: 'pl',
        duration: null
      }
    } catch (error) {
      Logger.error('[AudiotekaProvider] Scraping error', error)
      return null
    }
  }

  /**
   * Turn an href taken from the search page into an absolute URL.
   *
   * @param {string} [href] absolute or site-relative link
   * @returns {string|null} absolute URL, or null when href is missing or invalid
   */
  #resolveUrl(href) {
    if (!href || typeof href !== 'string') return null
    try {
      return new URL(href, this.#baseUrl).href
    } catch {
      return null
    }
  }

  /**
   * Pick the JSON-LD object describing the audiobook from the page.
   * All ld+json script tags are inspected; entries typed as a book/product
   * are preferred, otherwise the first entry that has a `name` is used.
   *
   * @param {Function} $ cheerio root for the product page
   * @returns {Object|null}
   */
  #extractJsonLd($) {
    const bookTypes = ['Audiobook', 'Book', 'Product']
    const candidates = []

    $('script[type="application/ld+json"]').each((index, element) => {
      try {
        const parsed = JSON.parse($(element).html())
        for (const item of Array.isArray(parsed) ? parsed : [parsed]) {
          if (item && typeof item === 'object' && item.name) candidates.push(item)
        }
      } catch {
        // Ignore a malformed JSON-LD block; another script tag may still be usable
      }
    })

    // "@type" may be a single string or an array of strings
    const isBook = (item) => [].concat(item['@type'] ?? []).some((type) => bookTypes.includes(type))
    return candidates.find(isBook) ?? candidates[0] ?? null
  }

  /**
   * Normalize a JSON-LD person/organization value to a list of names.
   * Accepts a comma separated string, an object with a `name`, or an array of either.
   *
   * @param {string|Object|Array<string|Object>} [value]
   * @returns {string[]}
   */
  #toNames(value) {
    if (value == null) return []
    const items = Array.isArray(value) ? value : [value]
    return items
      .flatMap((item) => (typeof item === 'string' ? item.split(',') : [item?.name]))
      .filter((name) => typeof name === 'string')
      .map((name) => name.trim())
      .filter(Boolean)
  }

  /**
   * Extract the year from a JSON-LD date value.
   * A leading four digit year is read directly so that date-only strings
   * do not shift to the previous year in timezones behind UTC.
   *
   * @param {string} [value]
   * @returns {number|null}
   */
  #toYear(value) {
    if (!value) return null
    const match = /^\s*(\d{4})\b/.exec(String(value))
    if (match) return Number(match[1])
    const year = new Date(value).getFullYear()
    return Number.isNaN(year) ? null : year
  }

  /**
   * Normalize a JSON-LD image value (string, object with `url`, or array of either) to a URL.
   *
   * @param {string|Object|Array<string|Object>} [image]
   * @returns {string|null}
   */
  #toImageUrl(image) {
    const first = Array.isArray(image) ? image[0] : image
    if (typeof first === 'string') return first
    return first?.url ?? null
  }
}

// Expose the provider class as this module's CommonJS export
module.exports = AudiotekaProvider

Audiobookshelf Server Version

v2.10.1

Current Implementation (Screenshot)

None

Originally created by @izikeros on GitHub (Jun 27, 2024). ### Type of Enhancement Server Backend ### Describe the Feature/Enhancement There is a service (Audioteka) that provides wide collection of audiobooks and has metadata for them. In audiobookshelf there are already providers of metadata, covers - this would be another possible source of metadata. ### Why would this be helpful? It would complement existing sources since it can provide metadata in Polish language. Use case: user has a collection of polish audiobooks (e.g. titles are in polish) and would like to enrich the library with metadata ### Future Implementation (Screenshot) I have some context info to AI and generated the code that has some chance to work. I'm not a javascript programmer and can't run/debug it. This might be some starting point. ```js const axios = require('axios').default const cheerio = require('cheerio') const Logger = require('../Logger') class AudiotekaProvider { #responseTimeout = 30000 constructor() {} /** * Search for an audiobook on audioteka.com.pl * @param {string} title * @param {string} author * @param {string} isbn * @param {string} providerSlug * @param {string} mediaType * @param {number} [timeout] response timeout in ms * @returns {Promise<Object[]>} */ async search(title, author, isbn, providerSlug, mediaType, timeout = this.#responseTimeout) { if (!timeout || isNaN(timeout)) timeout = this.#responseTimeout const encodedTitle = encodeURIComponent(title) const url = `https://audioteka.com/pl/search?query=${encodedTitle}` try { const response = await axios.get(url, { timeout }) const $ = cheerio.load(response.data) const results = [] $('.product-tile').each((index, element) => { const productUrl = $(element).find('a').attr('href') results.push(this.scrapeAudiobookDetails(productUrl)) }) return Promise.all(results) } catch (error) { Logger.error('[AudiotekaProvider] Search error', error) return [] } } /** * Scrape audiobook details from a specific URL * @param {string} 
url * @returns {Promise<Object>} */ async scrapeAudiobookDetails(url) { try { const response = await axios.get(url, { timeout: this.#responseTimeout }) const $ = cheerio.load(response.data) const jsonLd = JSON.parse($('script[type="application/ld+json"]').html()) const title = jsonLd.name const authors = jsonLd.author.split(', ') const narrator = jsonLd.readBy const publisher = jsonLd.publisher const publishedYear = new Date(jsonLd.datePublished).getFullYear() const description = $('article p').text().trim() const cover = jsonLd.image return { title, subtitle: null, author: authors.join(', '), narrator, publisher, publishedYear, description, cover, isbn: null, asin: null, genres: null, tags: null, series: null, language: 'pl', duration: null } } catch (error) { Logger.error('[AudiotekaProvider] Scraping error', error) return null } } } module.exports = AudiotekaProvider ``` ### Audiobookshelf Server Version v2.10.1 ### Current Implementation (Screenshot) None

adam added the enhancement label 2026-04-25 00:03:10 +02:00

adam closed this issue

2026-04-25 00:03:10 +02:00

adam commented

2026-04-25 00:03:11 +02:00

@izikeros commented on GitHub (Jun 27, 2024):

Some people tried to scrape the data and produce an OPF file in #602.

@izikeros commented on GitHub (Jun 27, 2024): Some people tried to scrape the data and produce an OPF file in #602.

adam commented

2026-04-25 00:03:11 +02:00

@nichwall commented on GitHub (Jun 27, 2024):

Duplicate of https://github.com/advplyr/audiobookshelf/issues/2598

Can you provide public API documentation? If there is not a public API (requiring scraping the web page within ABS), this would fit better as a custom metadata provider instead of being within ABS.

https://www.audiobookshelf.org/guides/custom-metadata-providers

@nichwall commented on GitHub (Jun 27, 2024): Duplicate of https://github.com/advplyr/audiobookshelf/issues/2598 Can you provide public API documentation? If there is not a public API (requiring scraping the web page within ABS), this would fit better as a custom metadata provider instead of being within ABS. https://www.audiobookshelf.org/guides/custom-metadata-providers

adam referenced this issue

2026-04-25 00:08:26 +02:00

[Bug]: Podcast library page load time is very high #2564

adam referenced this issue

2026-04-25 00:18:26 +02:00

[PR #3952] [MERGED] Improve book library page query performance on title, titleIgnorePrefix, and addedAt sort orders. #4129

adam referenced this issue

2026-04-25 00:18:36 +02:00

[PR #4080] [MERGED] Improve book library page query performance for author sort order #4162

Sign in to join this conversation.

Branches Tags

master

book_tags_genres_dedupe

episode_download_fallback

Issue-4540-SortBy-StartedDate-and-FinishedDate

episode_meta_tagging

fix_authorize_race_condition

redirect_transcode_requests

progress_updated_sort

fix_ereader_socket_event

fix_change_empty_root_password

fix_podcast_session_track_index

fix_set_token

session_modal_user

localize_durations

fix_oidc_create_user

jwt_auth_refactor

fix_scanner_deleting_single_file_books

fix_mediaprogress_updatedat_2

experimental_next_client

podcast_episode_duration

episode-timestamps-clickable

book_author_secondary_sort_title

podcast_useragents

pathexists_user_access

fix_pathexists_join

book_author_secondary_sort

clean_duplicate_mediaprogress

sanitize_html_description

trix_prevent_attachments

check_path_api_fix

fix_mediaprogress_updatedat

increase_express_json_limit

fix_dockerfile_nunicode

search_episodes

audiobook_tools_update

episode_secondary_sorts

hls_stream_url_update

new_session_track_endpoint

audiobook_tools_enhancements

watcher_rescans_update

player_track_tooltip

fix_exclude_prefixes_crash

socket_item_events

fix_podcast_episode_scanner_promise

new_stats_controller

count_cache_for_userpermissions

parsing-opf-v3

validate_migration_files

fix-quick-match-all-crash

fix-chapter-end-sleep-timer

stringify_sequelize_query

remove-col-ambiguity

fix_next_prev_edit_description

details_trim_whitespace

fix_content_url_basepath

fix_logger_fatal

progress_bar_visibility

batch-edit-populate-map-details

feed_generator_updates

bookmark-modal-updates

migrate-library-item-in-scanner

migrate-new-library-items

migrate-podcasts-new-library-item-2

migrate-podcasts-new-library-item

fix-remove-episode-from-playlist

playback-session-use-new-library-item

refactor-library-item

fix-heatmap-caption

feed-episodes-upsert

share-media-player-media-session-api

remove-old-playlist

remove_old_collection_object

plugin-implementation-demo

feed_migration

refactor-feeds-from-item

fix_remove_authors_no_books

v2.17.3-fk-constraints-migration

migrations-first-upgrade

sqlite_2

feature/nuxt-target-server

waveform

sqlite

playlists

video

1 Participants

Notifications

Due Date

No due date set.

Dependencies

No dependencies set.

Reference: starred/audiobookshelf#2073