NAME

MARC::Convert::Wikidata::Utils - Utilities for MARC::Convert::Wikidata.

SYNOPSIS

use MARC::Convert::Wikidata::Utils qw(clean_cover clean_date clean_edition_number clean_issn clean_number_of_pages clean_oclc clean_publication_date clean_publisher_name clean_publisher_place clean_series_name clean_series_ordinal clean_subtitle clean_title look_for_external_id);

my $cleaned_cover = clean_cover($cover);
my $cleaned_date = clean_date($date);
my ($cleaned_date, $options_hr) = clean_date($date);
my $cleaned_edition_number = clean_edition_number($edition_number);
my $cleaned_issn = clean_issn($issn);
my $cleaned_number_of_pages = clean_number_of_pages($number_of_pages);
my $cleaned_oclc = clean_oclc($oclc);
my ($cleaned_publication_date, $option) = clean_publication_date($publication_date);
my $cleaned_publisher_name = clean_publisher_name($publisher);
my $cleaned_publisher_place = clean_publisher_place($publisher_place);
my $cleaned_series_name = clean_series_name($series_name);
my $cleaned_series_ordinal = clean_series_ordinal($series_ordinal);
my $cleaned_subtitle = clean_subitle($subtitle);
my $cleaned_title = clean_title($title);
my $value = look_for_external_id($object, $external_id_name, $deprecation_flag);
my @values = look_for_external_id($object, $external_id_name, $deprecation_flag);

SUBROUTINES

clean_cover

my $cleaned_cover = clean_cover($cover);

Clean book cover in Czech language.

Returns string or undef.

clean_date

my $cleaned_date = clean_date($date);
my ($cleaned_date, $options_hr) = clean_date($date);

Clean date in Czech language.

Returns string or undef in scalar context. Returns string or undef of date and hash reference with options in array context.

clean_edition_number

my $cleaned_edition_number = clean_edition_number($edition_number);

Clean edition number in Czech language.

Returns string or undef.

clean_issn

my $cleaned_issn = clean_issn($issn);

Clean ISSN.

Returns string or undef.

clean_number_of_pages

my $cleaned_number_of_pages = clean_number_of_pages($number_of_pages);

Clean number of pages in Czech language.

Returns string or undef.

clean_oclc

my $cleaned_oclc = clean_oclc($oclc);

Clean OCLC number.

Returns string or undef.

clean_publication_date

my ($cleaned_publication_date, $option) = clean_publication_date($publication_date);

Clean publication date. Returned options could be 'circa' string in case that publication date is not precise.

Returns array with string or undef and string.

clean_publisher_name

my $cleaned_publisher_name = clean_publisher_name($publisher);

Clean publishing house.

Returns string or undef.

clean_publisher_place

my $cleaned_publisher_place = clean_publisher_place($publisher_place);

Clean place of publication in Czech language.

Returns string or undef.

clean_series_name

my $cleaned_series_name = clean_series_name($series_name);

Clean series name.

Returns string or undef.

clean_series_ordinal

my $cleaned_series_ordinal = clean_series_ordinal($series_ordinal);

Clean series ordinal in Czech language.

Returns string or undef.

clean_subtitle

my $cleaned_subtitle = clean_subtitle($subtitle);

Clean subtitle.

Returns string or undef.

clean_title

my $cleaned_title = clean_title($title);

Clean title.

Returns string or undef.

look_for_external_id

my $value = look_for_external_id($object, $external_id_name, $deprecation_flag);
my @values = look_for_external_id($object, $external_id_name, $deprecation_flag);

Look for external id values defined by name and deprecation flag.

Returns strings.

EXAMPLE1

use strict;
use warnings;

use MARC::Convert::Wikidata::Utils qw(clean_cover);
use Unicode::UTF8 qw(decode_utf8 encode_utf8);

my $cover = decode_utf8('(Vázáno) :');;
my $cleaned_cover = clean_cover($cover);

# Print out.
print encode_utf8("Cover: $cover\n");
print "Cleaned cover: $cleaned_cover\n";

# Output:
# Cover: (Vázáno) :
# Cleaned cover: hardback

EXAMPLE2

use strict;
use warnings;

use MARC::Convert::Wikidata::Utils qw(clean_date);
use Unicode::UTF8 qw(decode_utf8 encode_utf8);

my $date = decode_utf8('2020 březen 03.');
my $cleaned_date = clean_date($date);

# Print out.
print encode_utf8("Date: $date\n");
print "Cleaned date: $cleaned_date\n";

# Output:
# Date: 2020 březen 03.
# Cleaned date: 2020-03-03

EXAMPLE3

use strict;
use warnings;

use MARC::Convert::Wikidata::Utils qw(clean_edition_number);
use Unicode::UTF8 qw(decode_utf8 encode_utf8);

my $edition_number = decode_utf8('Druhé vydání');
my $cleaned_edition_number = clean_edition_number($edition_number);

# Print out.
print encode_utf8("Edition number: $edition_number\n");
print "Cleaned edition number: $cleaned_edition_number\n";

# Output:
# Edition number: Druhé vydání
# Cleaned edition number: 2

EXAMPLE4

use strict;
use warnings;

use MARC::Convert::Wikidata::Utils qw(clean_issn);

my $issn = '0585-5675 ;';
my $cleaned_issn = clean_issn($issn);

# Print out.
print "ISSN: $issn\n";
print "Cleaned ISSN: $cleaned_issn\n";

# Output:
# ISSN: 0585-5675 ;
# Cleaned ISSN: 0585-5675

EXAMPLE5

use strict;
use warnings;

use MARC::Convert::Wikidata::Utils qw(clean_number_of_pages);

my $number_of_pages = '575 s. ;';
my $cleaned_number_of_pages = clean_number_of_pages($number_of_pages);

# Print out.
print "Number of pages: $number_of_pages\n";
print "Cleaned number of pages: $cleaned_number_of_pages\n";

# Output:
# Number of pages: 575 s. ;
# Cleaned number of pages: 575

DEPENDENCIES

Exporter, List::Util, Readonly, Roman, Unicode::UTF8.

REPOSITORY

https://github.com/michal-josef-spacek/MARC-Convert-Wikidata

AUTHOR

Michal Josef Špaček mailto:skim@cpan.org

http://skim.cz

LICENSE AND COPYRIGHT

© 2021-2025 Michal Josef Špaček

BSD 2-Clause License

VERSION

0.22