You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
55 lines
1.9 KiB
55 lines
1.9 KiB
#!/usr/bin/env python
|
|
# -*- coding: utf-8 -*-
|
|
#
|
|
# GuessIt - A library for guessing information from filenames
|
|
# Copyright (c) 2012 Nicolas Wack <wackou@gmail.com>
|
|
#
|
|
# GuessIt is free software; you can redistribute it and/or modify it under
|
|
# the terms of the Lesser GNU General Public License as published by
|
|
# the Free Software Foundation; either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# GuessIt is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# Lesser GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the Lesser GNU General Public License
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
#
|
|
|
|
from __future__ import unicode_literals
|
|
from guessit import Guess
|
|
from guessit.transfo import SingleNodeGuesser
|
|
from guessit.language import search_language
|
|
import logging
|
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
|
|
def guess_language(string, node, skip=None):
|
|
if skip:
|
|
relative_skip = []
|
|
for entry in skip:
|
|
node_idx = entry['node_idx']
|
|
span = entry['span']
|
|
if node_idx == node.node_idx[:len(node_idx)]:
|
|
relative_span = (span[0] - node.offset + 1, span[1] - node.offset + 1)
|
|
relative_skip.append(relative_span)
|
|
skip = relative_skip
|
|
|
|
language, span, confidence = search_language(string, skip=skip)
|
|
if language:
|
|
return (Guess({'language': language},
|
|
confidence=confidence,
|
|
raw= string[span[0]:span[1]]),
|
|
span)
|
|
|
|
return None, None
|
|
|
|
guess_language.use_node = True
|
|
|
|
|
|
def process(mtree, *args, **kwargs):
|
|
SingleNodeGuesser(guess_language, None, log, *args, **kwargs).process(mtree)
|
|
# Note: 'language' is promoted to 'subtitleLanguage' in the post_process transfo
|
|
|