/*****************************************************************************
 * Media Library
 *****************************************************************************
 * Copyright (C) 2015 Hugo Beauzée-Luyssen, Videolabs
 *
 * Authors: Hugo Beauzée-Luyssen<hugo@beauzee.fr>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
 *****************************************************************************/

23
24
25
26
#if HAVE_CONFIG_H
# include "config.h"
#endif

27
28
29
30
31
#include "MetadataParser.h"
#include "Album.h"
#include "AlbumTrack.h"
#include "Artist.h"
#include "File.h"
32
33
34
#include "filesystem/IDevice.h"
#include "filesystem/IDirectory.h"
#include "Folder.h"
35
#include "Genre.h"
36
#include "Media.h"
37
#include "Playlist.h"
38
#include "Show.h"
39
#include "utils/Directory.h"
40
#include "utils/Filename.h"
41
#include "utils/Url.h"
42
#include "utils/ModificationsNotifier.h"
43
44
45
#include "discoverer/FsDiscoverer.h"
#include "discoverer/probe/PathProbe.h"

46
#include <cstdlib>
47

48
49
50
namespace medialibrary
{

51
MetadataParser::MetadataParser()
52
53
    : m_ml( nullptr )
    , m_previousFolderId( 0 )
54
55
56
{
}

57
bool MetadataParser::cacheUnknownArtist()
58
{
59
    m_unknownArtist = Artist::fetch( m_ml, UnknownArtistID );
60
61
62
63
64
    if ( m_unknownArtist == nullptr )
        LOG_ERROR( "Failed to cache unknown artist" );
    return m_unknownArtist != nullptr;
}

65
66
67
68
/// Binds this parser to a media library instance.
/// Stores the media library pointer, grabs its modification notifier and
/// caches the unknown artist.
/// \param ml The media library instance; it is dereferenced, so it must not be null
/// \return The result of cacheUnknownArtist()
bool MetadataParser::initialize( MediaLibrary* ml)
{
    m_ml = ml;
    m_notifier = m_ml->getNotifier();
    return cacheUnknownArtist();
}

72
/// Reads a metadata field from the task item and converts it to an integer.
/// \param item The task item holding the metadata
/// \param meta The metadata field to convert
/// \return The parsed value, or 0 when the field is empty or cannot be
///         converted by std::stoi (a warning is logged in the latter case)
int MetadataParser::toInt( parser::Task::Item& item, parser::Task::Item::Metadata meta )
{
    auto value = item.meta( meta );
    if ( value.empty() == true )
        return 0;
    try
    {
        return std::stoi( value );
    }
    catch ( const std::logic_error& ex )
    {
        // std::stoi reports both malformed and out of range input through
        // exceptions deriving from std::logic_error
        using MetaIndex = typename std::underlying_type<parser::Task::Item::Metadata>::type;
        LOG_WARN( "Invalid meta #",
                  static_cast<MetaIndex>( meta ),
                  " provided (", value, "): ", ex.what() );
    }
    return 0;
}

91
/// Processes a single parser task and stores what it describes in database.
///
/// A task carrying subitems is imported as a playlist through
/// addPlaylistMedias(). Any other task gets a Media & File created when it
/// has none, has its tracks stored, and is then handed over to
/// parseAudioFile() or parseVideoFile() depending on the track types.
///
/// \param item The task item to process
/// \return Completed for a playlist, Discarded when the Media & File already
///         existed in database, Success when the media was fully processed,
///         and Fatal in every other case.
parser::Task::Status MetadataParser::run( parser::Task::Item& item )
{
    // Assume that a file containing subitem(s) is a playlist
    if ( item.subItems().size() > 0 )
    {
        // Playlist addition may fail due to a constraint violation
        if ( addPlaylistMedias( item ) == false )
            return parser::Task::Status::Fatal;

        assert( item.file() != nullptr );
        return parser::Task::Status::Completed;
    }

    bool duplicateTask = false;
    if ( item.file() == nullptr )
    {
        assert( item.media() == nullptr );
        // Try to create Media & File
        auto mrl = item.mrl();
        try
        {
            auto transaction = m_ml->getConn()->newTransaction();
            LOG_INFO( "Adding ", mrl );
            auto newMedia = Media::create( m_ml, IMedia::Type::Unknown,
                                           utils::file::fileName( mrl ) );
            if ( newMedia == nullptr )
            {
                LOG_ERROR( "Failed to add media ", mrl, " to the media library" );
                return parser::Task::Status::Fatal;
            }
            // For now, assume all media are made of a single file
            auto newFile = newMedia->addFile( *item.fileFs(),
                                              item.parentFolder()->id(),
                                              item.parentFolderFs()->device()->isRemovable(),
                                              File::Type::Main );
            if ( newFile == nullptr )
            {
                LOG_ERROR( "Failed to add file ", mrl, " to media #", newMedia->id() );
                return parser::Task::Status::Fatal;
            }
            item.setMedia( std::move( newMedia ) );
            // Will invoke ITaskCb::updateFileId to update m_fileId & its
            // representation in DB
            item.setFile( std::move( newFile ) );
            transaction->commit();
        }
        // Voluntarily rely on an exception for a valid, but less common case,
        // to avoid database overhead
        catch ( sqlite::errors::ConstraintViolation& ex )
        {
            LOG_INFO( "Creation of Media & File failed because ", ex.what(),
                      ". Assuming this task is a duplicate" );
            // Try to retrieve the File & Media from database
            auto knownFile = File::fromMrl( m_ml, mrl );
            if ( knownFile == nullptr )
            {
                // The file is no longer present in DB, gracefully drop the task
                LOG_ERROR( "File ", mrl, " no longer present in DB, aborting");
                return parser::Task::Status::Fatal;
            }
            auto knownMedia = knownFile->media();
            // Without a media, we cannot go any further
            if ( knownMedia == nullptr )
                return parser::Task::Status::Fatal;
            item.setFile( std::move( knownFile ) );
            item.setMedia( std::move( knownMedia ) );

            duplicateTask = true;
        }
    }
    else if ( item.media() == nullptr )
    {
        // Having a file but no media is a problem: we can analyze as much as
        // we want, but won't be able to store anything.
        // Keep in mind that in this code path, we are not analyzing a playlist.
        assert( false );
        return parser::Task::Status::Fatal;
    }

    // Playlist membership is recorded even when the media already existed
    if ( item.parentPlaylist() != nullptr )
        item.parentPlaylist()->add( item.media()->id(), item.parentPlaylistIndex() );

    if ( duplicateTask == true )
        return parser::Task::Status::Discarded;

    const auto& tracks = item.tracks();
    if ( tracks.empty() == true )
        return parser::Task::Status::Fatal;

    // A single video track is enough to treat the media as a video
    bool isAudio = true;
    {
        using TracksT = decltype( tracks );
        sqlite::Tools::withRetries( 3, [this, &isAudio, &item]( TracksT trackList ) {
            auto transaction = m_ml->getConn()->newTransaction();
            for ( const auto& track : trackList )
            {
                if ( track.type != parser::Task::Item::Track::Type::Video )
                {
                    assert( track.type == parser::Task::Item::Track::Type::Audio );
                    item.media()->addAudioTrack( track.codec, track.bitrate,
                                               track.a.rate, track.a.nbChannels,
                                               track.language, track.description );
                    continue;
                }
                item.media()->addVideoTrack( track.codec, track.v.width, track.v.height,
                                      static_cast<float>( track.v.fpsNum ) /
                                          static_cast<float>( track.v.fpsDen ),
                                      track.language, track.description );
                isAudio = false;
            }
            item.media()->setDuration( item.duration() );
            transaction->commit();
        }, std::move( tracks ) );
    }

    const bool parsed = isAudio == true ? parseAudioFile( item )
                                        : parseVideoFile( item );
    if ( parsed == false )
        return parser::Task::Status::Fatal;

    // Don't notify about a media or file that got flagged as deleted meanwhile
    if ( item.file()->isDeleted() == true || item.media()->isDeleted() == true )
        return parser::Task::Status::Fatal;

    m_notifier->notifyMediaCreation( item.media() );
    return parser::Task::Status::Success;
}

224
225
/* Playlist files */

226
/// Imports the task's file as a playlist and schedules all of its subitems.
///
/// When the task has no file yet, the playlist and its file are created in a
/// single transaction. Otherwise the playlist is looked up from the task's
/// file id. In both cases every subitem is then passed to addPlaylistElement().
///
/// \param item The task item representing the playlist file
/// \return false when the playlist could not be fetched or created, true otherwise
bool MetadataParser::addPlaylistMedias( parser::Task::Item& item ) const
{
    const auto& mrl = item.mrl();
    LOG_INFO( "Try to import ", mrl, " as a playlist" );
    std::shared_ptr<Playlist> playlistPtr;
    if ( item.file() == nullptr )
    {
        // First time we see this playlist: name it after its title, or after
        // its file name when no title is available
        auto playlistName = item.meta( parser::Task::Item::Metadata::Title );
        if ( playlistName.empty() == true )
            playlistName = utils::url::decode( utils::file::fileName( mrl ) );
        auto transaction = m_ml->getConn()->newTransaction();
        playlistPtr = Playlist::create( m_ml, playlistName );
        if ( playlistPtr == nullptr )
        {
            LOG_ERROR( "Failed to create playlist ", mrl, " to the media library" );
            return false;
        }

        auto playlistFile = playlistPtr->addFile( *item.fileFs(),
                                                  item.parentFolder()->id(),
                                                  item.parentFolderFs()->device()->isRemovable() );
        if ( playlistFile == nullptr )
        {
            LOG_ERROR( "Failed to add playlist file ", mrl );
            return false;
        }
        // Will invoke ITaskCb::updateFileId to update m_fileId & its
        // representation in DB
        item.setFile( std::move( playlistFile ) );
        transaction->commit();
    }
    else
    {
        // We are most likely re-scanning a file representing a playlist.
        // A task having a file means the playlist & the associated file have
        // already been created.
        std::string req = "SELECT * FROM " + policy::PlaylistTable::Name +
                " WHERE file_id = ?";
        playlistPtr = Playlist::fetch( m_ml, req, item.file()->id() );
        if ( playlistPtr == nullptr )
        {
            // The playlist had to be created, something is very wrong, give up
            // FIXME: Check that the task will be deleted.
            assert( false );
            return false;
        }
    }

    // Regardless of the playlist being re-scanned or discovered for the first
    // time, just schedule all members for insertion. Media & files will be
    // recreated if need be, and the appropriate entries in the
    // PlaylistMediaRelation table will be recreated to link things together.
    auto members = item.subItems();
    for ( const auto& member : members ) // FIXME: Interrupt loop if paused
        addPlaylistElement( item, playlistPtr, member );

    return true;
}

285
286
void MetadataParser::addPlaylistElement( parser::Task::Item& item,
                                         std::shared_ptr<Playlist> playlistPtr,
287
                                         const parser::Task::Item& subitem ) const
288
{
289
    const auto& mrl = subitem.mrl();
290
    LOG_INFO( "Try to add ", mrl, " to the playlist ", mrl );
291
292
293
    auto media = m_ml->media( mrl );
    if ( media != nullptr )
    {
294
        LOG_INFO( "Media for ", mrl, " already exists, adding it to the playlist ", mrl );
295
        playlistPtr->add( media->id(), subitem.parentPlaylistIndex() );
296
297
298
299
300
301
302
303
304
        return;
    }
    // Create Media, etc.
    auto fsFactory = m_ml->fsFactoryForMrl( mrl );

    if ( fsFactory == nullptr ) // Media not supported by any FsFactory, registering it as external
    {
        auto t2 = m_ml->getConn()->newTransaction();
        auto externalMedia = Media::create( m_ml, IMedia::Type::Unknown, utils::url::encode(
305
                subitem.meta( parser::Task::Item::Metadata::Title ) ) );
306
307
        if ( externalMedia == nullptr )
        {
308
            LOG_ERROR( "Failed to create external media for ", mrl, " in the playlist ", item.mrl() );
309
310
311
312
313
            return;
        }
        // Assuming that external mrl present in playlist file is a main media resource
        auto externalFile = externalMedia->addExternalMrl( mrl, IFile::Type::Main );
        if ( externalFile == nullptr )
314
            LOG_ERROR( "Failed to create external file for ", mrl, " in the playlist ", item.mrl() );
315
        playlistPtr->add( externalMedia->id(), subitem.parentPlaylistIndex() );
316
317
318
319
320
321
322
323
324
325
326
327
328
        t2->commit();
        return;
    }
    bool isDirectory;
    try
    {
        isDirectory = utils::fs::isDirectory( utils::file::toLocalPath( mrl ) );
    }
    catch ( std::system_error& ex )
    {
        LOG_ERROR( ex.what() );
        return;
    }
329
    LOG_INFO( "Importing ", isDirectory ? "folder " : "file ", mrl, " in the playlist ", item.mrl() );
330
331
332
333
    auto directoryMrl = utils::file::directory( mrl );
    auto parentFolder = Folder::fromMrl( m_ml, directoryMrl );
    bool parentKnown = parentFolder != nullptr;

334
335
336
337
338
339
340
341
    // The minimal entrypoint must be a device mountpoint
    auto device = fsFactory->createDeviceFromMrl( mrl );
    if ( device == nullptr )
    {
        LOG_ERROR( "Can't add a local folder with unknown storage device. ");
        return;
    }
    auto entryPoint = device->mountpoint();
342
343
    if ( parentKnown == false && Folder::fromMrl( m_ml, entryPoint ) != nullptr )
    {
344
345
346
347
        auto probePtr = std::unique_ptr<prober::PathProbe>(
                    new prober::PathProbe{ utils::file::stripScheme( mrl ),
                       isDirectory, std::move( playlistPtr ), parentFolder,
                       utils::file::stripScheme( directoryMrl ), subitem.parentPlaylistIndex(), true } );
348
        FsDiscoverer discoverer( fsFactory, m_ml, nullptr, std::move( probePtr ) );
349
350
351
        discoverer.reload( entryPoint );
        return;
    }
352
353
354
355
    auto probePtr = std::unique_ptr<prober::PathProbe>(
                new prober::PathProbe{ utils::file::stripScheme( mrl ),
                   isDirectory, std::move( playlistPtr ), parentFolder,
                   utils::file::stripScheme( directoryMrl ), subitem.parentPlaylistIndex(), false } );
356
    FsDiscoverer discoverer( fsFactory, m_ml, nullptr, std::move( probePtr ) );
357
358
359
    if ( parentKnown == false )
    {
        discoverer.discover( entryPoint );
360
361
362
        auto entryFolder = Folder::fromMrl( m_ml, entryPoint );
        if ( entryFolder != nullptr )
            Folder::excludeEntryFolder( m_ml, entryFolder->id() );
363
364
365
366
367
        return;
    }
    discoverer.reload( directoryMrl );
}

368
369
/* Video files */

370
/// Stores the metadata of a video media.
///
/// The media is flagged as a video. When a title is available, the title,
/// artwork and show/episode information are saved in a single transaction,
/// retried up to 3 times through sqlite::Tools::withRetries.
///
/// \param item The task item being parsed
/// \return true when there is no title to store, otherwise the result of the
///         transaction; the transaction body yields false only when a show
///         could not be created
bool MetadataParser::parseVideoFile( parser::Task::Item& item ) const
{
    auto media = item.media().get();
    media->setType( IMedia::Type::Video );
    const auto& title = item.meta( parser::Task::Item::Metadata::Title );
    if ( title.length() == 0 )
        return true;

    const auto& showName = item.meta( parser::Task::Item::Metadata::ShowName );
    const auto& artworkMrl = item.meta( parser::Task::Item::Metadata::ArtworkUrl );

    return sqlite::Tools::withRetries( 3, [this, &showName, &title, &item, &artworkMrl]() {
        auto t = m_ml->getConn()->newTransaction();
        item.media()->setTitleBuffered( title );

        if ( artworkMrl.empty() == false )
            item.media()->setThumbnail( artworkMrl, Thumbnail::Origin::Media );

        // Without a show name, there is currently no way to know if this is
        // a movie or a random video, so nothing more gets stored.
        if ( showName.length() != 0 )
        {
            auto show = m_ml->show( showName );
            if ( show == nullptr )
            {
                show = m_ml->createShow( showName );
                if ( show == nullptr )
                    return false;
            }
            // An episode number of 0 means the meta was absent or invalid
            auto episode = toInt( item, parser::Task::Item::Metadata::Episode );
            if ( episode != 0 )
            {
                std::shared_ptr<Show> s = std::static_pointer_cast<Show>( show );
                s->addEpisode( *item.media(), title, episode );
            }
        }
        item.media()->save();
        t->commit();
        return true;
    });
}

/* Audio files */

417
/// Stores the metadata of an audio media: genre, artists, album and track.
///
/// The genre, the artists and a candidate album are resolved first; the
/// album creation (when no candidate matched), the track insertion and the
/// linking are then performed in a single transaction, retried up to 3 times
/// through sqlite::Tools::withRetries.
///
/// \param item The task item being parsed
/// \return false when no artist could be resolved, when the album or the
///         track could not be created, or when link() fails; true otherwise
bool MetadataParser::parseAudioFile( parser::Task::Item& item )
{
    item.media()->setType( IMedia::Type::Audio );

    auto artworkMrl = item.meta( parser::Task::Item::Metadata::ArtworkUrl );
    if ( artworkMrl.empty() == false )
    {
        item.media()->setThumbnail( artworkMrl, Thumbnail::Origin::Media );
        // Don't use an attachment as default artwork for album/artists
        if ( utils::file::schemeIs( "attachment", artworkMrl ) )
            artworkMrl.clear();
    }

    auto genre = handleGenre( item );
    auto artists = findOrCreateArtist( item );
    if ( artists.first == nullptr && artists.second == nullptr )
        return false;
    auto album = findAlbum( item, artists.first, artists.second );
    return sqlite::Tools::withRetries( 3, [this, &item, &artists]( std::string artworkMrl,
                                                  std::shared_ptr<Album> album, std::shared_ptr<Genre> genre ) {
        auto t = m_ml->getConn()->newTransaction();
        if ( album == nullptr )
        {
            const auto& albumName = item.meta( parser::Task::Item::Metadata::Album );
            int64_t thumbnailId = 0;
            if ( artworkMrl.empty() == false )
            {
                auto thumbnail = Thumbnail::create( m_ml, artworkMrl,
                                                    Thumbnail::Origin::Album );
                if ( thumbnail != nullptr )
                    thumbnailId = thumbnail->id();
            }
            album = m_ml->createAlbum( albumName, thumbnailId );
            if ( album == nullptr )
                return false;
            m_notifier->notifyAlbumCreation( album );
        }
        // If we know a track artist, specify it, otherwise, fallback to the album/unknown artist
        auto track = handleTrack( album, item, artists.second ? artists.second : artists.first,
                                  genre.get() );
        // handleTrack() returns nullptr when the track could not be created;
        // bail out before committing so we don't link a track-less media.
        if ( track == nullptr )
            return false;

        auto res = link( *item.media(), album, artists.first, artists.second );
        item.media()->save();
        t->commit();
        return res;
    }, std::move( artworkMrl ), std::move( album ), std::move( genre ) );
}

466
/// Returns the genre named by the item's Genre metadata, creating it if needed.
/// \param item The task item being parsed
/// \return The matching or newly created genre; nullptr when the item has no
///         genre metadata or when the genre could not be created
std::shared_ptr<Genre> MetadataParser::handleGenre( parser::Task::Item& item ) const
{
    const auto& genreStr = item.meta( parser::Task::Item::Metadata::Genre );
    if ( genreStr.length() == 0 )
        return nullptr;
    auto genre = Genre::fromName( m_ml, genreStr );
    if ( genre == nullptr )
    {
        genre = Genre::create( m_ml, genreStr );
        if ( genre == nullptr )
            LOG_ERROR( "Failed to get/create Genre ", genreStr );
    }
    return genre;
}

481
/* Album handling */
482

483
/// Looks for an already known album matching the item being parsed.
///
/// Without an album name, the "unknown album" of the album artist, track
/// artist or unknown artist (in that order) is returned. Otherwise, all the
/// albums with the same title are fetched and filtered with a set of
/// heuristics (album artist, disc information, folder, release year).
///
/// \param item The task item being parsed
/// \param albumArtist The album artist, or nullptr if unknown
/// \param trackArtist The track artist, or nullptr if unknown
/// \return The selected album, or nullptr when no candidate survived the
///         filtering, in which case the caller is expected to create one
std::shared_ptr<Album> MetadataParser::findAlbum( parser::Task::Item& item, std::shared_ptr<Artist> albumArtist,
                                                    std::shared_ptr<Artist> trackArtist )
{
    const auto& albumName = item.meta( parser::Task::Item::Metadata::Album );
    if ( albumName.empty() == true )
    {
        if ( albumArtist != nullptr )
            return albumArtist->unknownAlbum();
        if ( trackArtist != nullptr )
            return trackArtist->unknownAlbum();
        return m_unknownArtist->unknownAlbum();
    }

    // Shortcut: same title & same folder as the previously matched album
    const bool sameAsPrevious = m_previousAlbum != nullptr &&
                                albumName == m_previousAlbum->title() &&
                                m_previousFolderId != 0 &&
                                item.file()->folderId() == m_previousFolderId;
    if ( sameAsPrevious == true )
        return m_previousAlbum;
    m_previousAlbum.reset();
    m_previousFolderId = 0;

    // Candidates are fetched by title only. Album matching depends on the
    // difference between artist & album artist, which is handled by the
    // filtering below.
    static const std::string req = "SELECT * FROM " + policy::AlbumTable::Name +
            " WHERE title = ?";
    auto albums = Album::fetchAll<Album>( m_ml, req, albumName );

    if ( albums.size() == 0 )
        return nullptr;

    const auto discTotal = toInt( item, parser::Task::Item::Metadata::DiscTotal );
    const auto discNumber = toInt( item, parser::Task::Item::Metadata::DiscNumber );

    // Tells whether a candidate album should be kept as a possible match.
    auto isPossibleMatch = [&]( Album& candidate ) -> bool {
        auto candidateAlbumArtist = candidate.albumArtist();
        // When we find an album, we will systematically assign an artist to it.
        // Not having an album artist (even if it's only a temporary one in the
        // case of a compilation album) is not expected at all.
        assert( candidateAlbumArtist != nullptr );
        // We assume that an album without album artist is a positive match.
        // At the end of the day, without proper tags, there's only so much we can do.
        if ( albumArtist != nullptr && candidateAlbumArtist->id() != albumArtist->id() )
            return false;

        // If this is a multidisc album, assume it could be spread over multiple
        // folders. Since folders can come in any order, we can't assume the first
        // album will be the first media we see. If the discTotal or discNumber
        // meta are provided, that's easy. If not, we assume that another CD with
        // the same name & artists, and a disc number > 1 denotes a multi disc album.
        // Check the first case early to avoid fetching tracks if not required.
        if ( discTotal > 1 || discNumber > 1 )
            return true;

        const auto tracks = candidate.cachedTracks();
        // If there are no tracks to compare with, we just have to hope this
        // will be the only valid album match
        if ( tracks.size() == 0 )
            return true;

        auto multiDisc = false;
        auto multipleArtists = false;
        int64_t previousArtistId = trackArtist != nullptr ? trackArtist->id() : 0;
        for ( const auto& track : tracks )
        {
            auto albumTrack = track->albumTrack();
            assert( albumTrack != nullptr );
            if ( albumTrack == nullptr )
                continue;
            if ( albumTrack->discNumber() > 1 )
                multiDisc = true;
            const auto currentArtistId = albumTrack->artist()->id();
            if ( previousArtistId != 0 && previousArtistId != currentArtistId )
                multipleArtists = true;
            previousArtistId = currentArtistId;
            // We now know enough about the album, we can stop looking at its tracks
            if ( multiDisc == true && multipleArtists == true )
                break;
        }
        if ( multiDisc )
            return true;

        // Assume album files will be in the same folder.
        auto newFileFolder = utils::file::directory( item.file()->mrl() );
        auto trackFiles = tracks[0]->files();
        bool differentFolder = false;
        for ( const auto& trackFile : trackFiles )
        {
            if ( utils::file::directory( trackFile->mrl() ) != newFileFolder )
            {
                differentFolder = true;
                break;
            }
        }
        // We now have a candidate by the same artist in the same folder,
        // assume it to be a positive match.
        if ( differentFolder == false )
            return true;

        // Attempt to discriminate by date, but only for the same artists.
        // Not taking the artist in consideration would cause compilations to
        // create multiple albums, especially when tracks are only partially
        // tagged with a year.
        if ( multipleArtists == false )
        {
            auto candidateDate = item.meta( parser::Task::Item::Metadata::Date );
            if ( candidateDate.empty() == false )
            {
                try
                {
                    unsigned int year = std::stoi( candidateDate );
                    return year == candidate.releaseYear();
                }
                catch (...)
                {
                    // Date wasn't helpful, simply ignore the error and continue
                }
            }
        }
        // The candidate is :
        // - in a different folder
        // - not a multidisc album
        // - Either:
        //      - from the same artist & without a date to discriminate
        //      - from the same artist & with a different date
        //      - from different artists
        // Assume it's a negative match.
        return false;
    };

    /*
     * Even if we get only 1 album, we need to filter out invalid matches.
     * For instance, if we have already inserted an album "A" by an artist "john"
     * but we are now trying to handle an album "A" by an artist "doe", not filtering
     * candidates would yield the only "A" album we know, while we should return
     * nullptr, so a new album can be created by the caller.
     */
    auto it = begin( albums );
    while ( it != end( albums ) )
    {
        if ( isPossibleMatch( **it ) == true )
            ++it;
        else
            it = albums.erase( it );
    }

    if ( albums.size() == 0 )
        return nullptr;
    if ( albums.size() > 1 )
    {
        LOG_WARN( "Multiple candidates for album ", albumName, ". Selecting first one out of luck" );
    }
    // Remember the match to speed up the lookup for the next track
    m_previousFolderId = item.file()->folderId();
    m_previousAlbum = albums[0];
    return albums[0];
}

///
/// \brief MetadataParser::handleArtists Returns Artist's involved on a track
650
/// \param task The current parser task
651
652
653
654
/// \return A pair containing:
/// The album artist as a first element
/// The track artist as a second element, or nullptr if it is the same as album artist
///
655
std::pair<std::shared_ptr<Artist>, std::shared_ptr<Artist>> MetadataParser::findOrCreateArtist( parser::Task::Item& item ) const
656
657
658
{
    std::shared_ptr<Artist> albumArtist;
    std::shared_ptr<Artist> artist;
659
    static const std::string req = "SELECT * FROM " + policy::ArtistTable::Name + " WHERE name = ?";
660

661
662
    const auto& albumArtistStr = item.meta( parser::Task::Item::Metadata::AlbumArtist );
    const auto& artistStr = item.meta( parser::Task::Item::Metadata::Artist );
663
    if ( albumArtistStr.empty() == true && artistStr.empty() == true )
664
    {
665
        return {m_unknownArtist, m_unknownArtist};
666
667
    }

668
    if ( albumArtistStr.empty() == false )
669
    {
670
        albumArtist = Artist::fetch( m_ml, req, albumArtistStr );
671
672
        if ( albumArtist == nullptr )
        {
673
            albumArtist = m_ml->createArtist( albumArtistStr );
674
675
            if ( albumArtist == nullptr )
            {
676
                LOG_ERROR( "Failed to create new artist ", albumArtistStr );
677
678
                return {nullptr, nullptr};
            }
679
            m_notifier->notifyArtistCreation( albumArtist );
680
681
        }
    }
682
    if ( artistStr.empty() == false && artistStr != albumArtistStr )
683
    {
684
        artist = Artist::fetch( m_ml, req, artistStr );
685
686
        if ( artist == nullptr )
        {
687
            artist = m_ml->createArtist( artistStr );
688
689
            if ( artist == nullptr )
            {
690
                LOG_ERROR( "Failed to create new artist ", artistStr );
691
692
                return {nullptr, nullptr};
            }
693
            m_notifier->notifyArtistCreation( artist );
694
695
696
697
698
699
700
        }
    }
    return {albumArtist, artist};
}

/* Tracks handling */

701
std::shared_ptr<AlbumTrack> MetadataParser::handleTrack( std::shared_ptr<Album> album, parser::Task::Item& item,
702
                                                         std::shared_ptr<Artist> artist, Genre* genre ) const
703
{
704
705
    assert( sqlite::Transaction::transactionInProgress() == true );

706
707
708
    auto title = item.meta( parser::Task::Item::Metadata::Title );
    const auto trackNumber = toInt( item, parser::Task::Item::Metadata::TrackNumber );
    const auto discNumber = toInt( item, parser::Task::Item::Metadata::DiscNumber );
709
710
711
    if ( title.empty() == true )
    {
        LOG_WARN( "Failed to get track title" );
712
        if ( trackNumber != 0 )
713
714
        {
            title = "Track #";
715
            title += std::to_string( trackNumber );
716
717
718
        }
    }
    if ( title.empty() == false )
719
        item.media()->setTitleBuffered( title );
720

721
    auto track = std::static_pointer_cast<AlbumTrack>( album->addTrack( item.media(), trackNumber,
722
                                                                        discNumber, artist->id(),
723
                                                                        genre ) );
724
725
726
727
728
    if ( track == nullptr )
    {
        LOG_ERROR( "Failed to create album track" );
        return nullptr;
    }
729

730
    const auto& releaseDate = item.meta( parser::Task::Item::Metadata::Date );
731
    if ( releaseDate.empty() == false )
732
    {
733
        auto releaseYear = atoi( releaseDate.c_str() );
734
        item.media()->setReleaseDate( releaseYear );
735
736
737
738
739
        // Let the album handle multiple dates. In order to do this properly, we need
        // to know if the date has been changed before, which can be known only by
        // using Album class internals.
        album->setReleaseYear( releaseYear, false );
    }
740
    m_notifier->notifyAlbumTrackCreation( track );
741
742
743
744
745
746
    return track;
}

/* Misc */

// Links a media with its album and its artist(s).
//
// - media:       the media being linked.
// - album:       the album the media belongs to; must not be nullptr.
// - albumArtist: the album artist; may be nullptr, in which case `artist`
//                (which must then be non-null) is used in its place.
// - artist:      the track artist; may be nullptr when albumArtist is provided.
//
// In order, this:
//  1. propagates the album thumbnail to the album artist and track artist,
//     except for the unknown/various artists entities;
//  2. registers the media on the artist(s);
//  3. assigns the album's main artist, switching it to "various artists" as
//     soon as a track's album artist differs from the current one, and updates
//     the artists' track counts accordingly.
//
// Returns true on success, false if the various artists entity was required
// but could not be fetched.
bool MetadataParser::link( Media& media, std::shared_ptr<Album> album,
                               std::shared_ptr<Artist> albumArtist, std::shared_ptr<Artist> artist )
{
    if ( albumArtist == nullptr )
    {
        assert( artist != nullptr );
        albumArtist = artist;
    }
    assert( album != nullptr );

    auto albumThumbnail = album->thumbnail();

    // We might modify albumArtist later, hence handle thumbnails before.
    // If we have an albumArtist (meaning the track was properly tagged), we
    // can assume this artist is a correct match. We can use the thumbnail from
    // the current album for the albumArtist, if none has been set before.
    // Although we don't want to do this for unknown/various artists, as the
    // thumbnail wouldn't reflect those "special" artists
    if ( albumArtist != nullptr && albumArtist->id() != UnknownArtistID &&
         albumArtist->id() != VariousArtistID &&
         albumThumbnail != nullptr )
    {
        auto albumArtistThumbnail = albumArtist->thumbnail();
        // Assign the album thumbnail when the album artist has none, or when
        // its current one was assigned from an album this artist was only
        // featuring on (Origin::Artist). This second case used to be an empty
        // branch, so such a thumbnail was never upgraded.
        // NOTE(review): assumes Artist::setArtworkMrl() overwrites an already
        // assigned thumbnail — confirm against the Artist implementation.
        if ( albumArtistThumbnail == nullptr ||
             albumArtistThumbnail->origin() == Thumbnail::Origin::Artist )
        {
            albumArtist->setArtworkMrl( albumThumbnail->mrl(), Thumbnail::Origin::AlbumArtist );
        }
    }

    // Until we have a better artwork extraction/assignation, simply do the same
    // for artists
    if ( artist != nullptr && artist->id() != UnknownArtistID &&
         artist->id() != VariousArtistID &&
         albumThumbnail != nullptr && artist->thumbnail() == nullptr )
    {
        artist->setArtworkMrl( album->artworkMrl(), Thumbnail::Origin::Artist );
    }

    if ( albumArtist != nullptr )
        albumArtist->addMedia( media );
    // Don't register the media twice when both artists are the same entity
    if ( artist != nullptr && ( albumArtist == nullptr || albumArtist->id() != artist->id() ) )
        artist->addMedia( media );

    auto currentAlbumArtist = album->albumArtist();

    // If we have no main artist yet, that's easy, we need to assign one.
    if ( currentAlbumArtist == nullptr )
    {
        // We don't know if the artist was tagged as artist or albumartist, however, we simply add it
        // as the albumartist until proven we were wrong (ie. until one of the next tracks
        // has a different artist)
        album->setAlbumArtist( albumArtist );
        // Always add the album artist as an artist
        album->addArtist( albumArtist );
        // Always update the album artist number of tracks.
        // The artist might be different, and will be handled a few lines below
        albumArtist->updateNbTrack( 1 );
        if ( artist != nullptr )
        {
            // If the album artist is not the artist, we need to update the
            // artist track count as well.
            if ( albumArtist->id() != artist->id() )
                artist->updateNbTrack( 1 );
            album->addArtist( artist );
        }
    }
    else
    {
        // We have more than a single artist on this album, fallback to various artists
        if ( albumArtist->id() != currentAlbumArtist->id() )
        {
            if ( m_variousArtists == nullptr )
            {
                m_variousArtists = Artist::fetch( m_ml, VariousArtistID );
                // Bail out instead of dereferencing a null entity below
                if ( m_variousArtists == nullptr )
                {
                    LOG_ERROR( "Failed to fetch the various artists entity" );
                    return false;
                }
            }
            // If we already switched to various artist, no need to do it again
            if ( m_variousArtists->id() != currentAlbumArtist->id() )
            {
                // All tracks from this album must now also be reflected in various
                // artist number of tracks
                m_variousArtists->updateNbTrack( album->nbTracks() );
                album->setAlbumArtist( m_variousArtists );
            }
            // However we always need to bump the various artist number of tracks
            else
            {
                m_variousArtists->updateNbTrack( 1 );
            }
            // Add this artist as "featuring".
            album->addArtist( albumArtist );
        }
        if ( artist != nullptr && artist->id() != albumArtist->id() )
        {
            album->addArtist( artist );
            artist->updateNbTrack( 1 );
        }
        albumArtist->updateNbTrack( 1 );
    }

    return true;
}

// Returns the name identifying this parser: the constant string "Metadata".
const char* MetadataParser::name() const
{
    constexpr const char* serviceName = "Metadata";
    return serviceName;
}
856
857
858
859
860
861
862
863
864
865

// Returns the thread count for this parser: always 1 for now.
//
// The disabled code below would use std::thread::hardware_concurrency()
// instead; it stays commented out until this code is made thread-safe.
uint8_t MetadataParser::nbThreads() const
{
//    auto nbProcs = std::thread::hardware_concurrency();
//    if ( nbProcs == 0 )
//        return 1;
//    return nbProcs;
    // Let's make this code thread-safe first :)
    constexpr uint8_t singleThread = 1;
    return singleThread;
}
866

867
void MetadataParser::onFlushing()
868
869
870
871
872
873
{
    m_variousArtists = nullptr;
    m_previousAlbum = nullptr;
    m_previousFolderId = 0;
}

874
void MetadataParser::onRestarted()
875
876
{
    // Reset locally cached entities
877
    cacheUnknownArtist();
878
879
}

880
// Tells whether `task` already has its MetadataAnalysis step flagged as
// completed. As long as it doesn't, this parser still needs to run on it.
bool MetadataParser::isCompleted( const parser::Task& task ) const
{
    const auto analysisStep = parser::Task::ParserStep::MetadataAnalysis;
    return task.isStepCompleted( analysisStep );
}

886
887
888
889
890
// Returns the parser step this service is responsible for: MetadataAnalysis.
parser::Task::ParserStep MetadataParser::targetedStep() const
{
    using Step = parser::Task::ParserStep;
    return Step::MetadataAnalysis;
}

891
}