hydrus/include/ClientDB.py

import ClientData
import ClientDefaults
import ClientFiles
import ClientImporting
import ClientMedia
import ClientRatings
import ClientThreading
import collections
import hashlib
import httplib
import itertools
import json
import HydrusConstants as HC
import HydrusDB
import ClientDownloading
import ClientImageHandling
import HydrusExceptions
import HydrusFileHandling
import HydrusImageHandling
import HydrusNATPunch
import HydrusPaths
import HydrusSerialisable
import HydrusTagArchive
import HydrusTags
import HydrusThreading
import ClientConstants as CC
import lz4
import numpy
import os
import psutil
import Queue
import random
import shutil
import sqlite3
import stat
import sys
import threading
import time
import traceback
import wx
import yaml
import HydrusData
import ClientSearch
import HydrusGlobals

YAML_DUMP_ID_SINGLE = 0
YAML_DUMP_ID_REMOTE_BOORU = 1
YAML_DUMP_ID_FAVOURITE_CUSTOM_FILTER_ACTIONS = 2
YAML_DUMP_ID_GUI_SESSION = 3
YAML_DUMP_ID_IMAGEBOARD = 4
YAML_DUMP_ID_IMPORT_FOLDER = 5
YAML_DUMP_ID_EXPORT_FOLDER = 6
YAML_DUMP_ID_SUBSCRIPTION = 7
YAML_DUMP_ID_LOCAL_BOORU = 8
'''
class MessageDB( object ):

    def _AddContact( self, contact ):

        ( public_key, name, host, port ) = contact.GetInfo()

        contact_key = contact.GetContactKey()

        if public_key is not None: contact_key = sqlite3.Binary( contact_key )

        self._c.execute( 'INSERT OR IGNORE INTO contacts ( contact_key, public_key, name, host, port ) VALUES ( ?, ?, ?, ?, ? );', ( contact_key, public_key, name, host, port ) )


    def _AddMessage( self, transport_message, serverside_message_key = None, forced_status = None ):

        ( contact_from, contacts_to, message_key, conversation_key, timestamp, subject, body, files ) = transport_message.GetInfo()

        if contact_from is None or contact_from.GetName() == 'Anonymous':

            contact_id_from = 1

        else:

            contact_id_from = self._GetContactId( contact_from )

            # changes whatever they want to say their name and public key is to whatever we prefer it to be
            contact_from = self._GetContact( contact_id_from )

            public_key = contact_from.GetPublicKey()

            try: transport_message.VerifyIsFromCorrectPerson( public_key )
            except:

                HydrusData.ShowText( 'received a message that did not verify' )

                return


        conversation_id = self._GetConversationId( conversation_key, subject )

        message_id = self._GetMessageId( message_key )

        result = self._c.execute( 'SELECT 1 FROM messages WHERE message_id = ?;', ( message_id, ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT OR IGNORE INTO messages ( conversation_id, message_id, contact_id_from, timestamp ) VALUES ( ?, ?, ?, ? );', ( conversation_id, message_id, contact_id_from, timestamp ) )

            self._c.execute( 'INSERT OR IGNORE INTO message_bodies ( docid, body ) VALUES ( ?, ? );', ( message_id, body ) )

            attachment_hashes = []

            if len( files ) > 0:

                for file in files:

                    ( os_file_handle, temp_path ) = HydrusPaths.GetTempPath()

                    try:

                        with open( temp_path, 'wb' ) as f: f.write( file )

                        ( result, hash ) = self._ImportFile( temp_path, override_deleted = True ) # what if the file fails?

                        attachment_hashes.append( hash )

                    finally:

                        HydrusPaths.CleanUpTempPath( os_file_handle, temp_path )


                hash_ids = self._GetHashIds( attachment_hashes )

                self._c.executemany( 'INSERT OR IGNORE INTO message_attachments ( message_id, hash_id ) VALUES ( ?, ? );', [ ( message_id, hash_id ) for hash_id in hash_ids ] )


            if forced_status is None: status = 'sent'
            else: status = forced_status

            status_id = self._GetStatusId( status )

            inboxable_contact_ids = { id for ( id, ) in self._c.execute( 'SELECT contact_id FROM message_depots;' ) }

            inbox = False

            for contact_to in contacts_to:

                contact_id_to = self._GetContactId( contact_to )

                if contact_id_to in inboxable_contact_ids:

                    self._c.execute( 'INSERT OR IGNORE INTO message_inbox ( message_id ) VALUES ( ? );', ( message_id, ) )

                    inbox = True


                self._c.execute( 'INSERT OR IGNORE INTO message_destination_map ( message_id, contact_id_to, status_id ) VALUES ( ?, ?, ? );', ( message_id, contact_id_to, status_id ) )


            destinations = [ ( contact_to, status ) for contact_to in contacts_to ]

            message = ClientConstantsMessages.Message( message_key, contact_from, destinations, timestamp, body, attachment_hashes, inbox )

            self.pub_after_commit( 'new_message', conversation_key, message )


        if serverside_message_key is not None:

            serverside_message_id = self._GetMessageId( serverside_message_key )

            self._c.execute( 'DELETE FROM message_downloads WHERE message_id = ?;', ( serverside_message_id, ) )


    def _AddMessageInfoSince( self, service_key, serverside_message_keys, statuses, new_last_check ):

        # message_keys

        service_id = self._GetServiceId( service_key )

        serverside_message_ids = set( self._GetMessageIds( serverside_message_keys ) )

        self._c.executemany( 'INSERT OR IGNORE INTO message_downloads ( service_id, message_id ) VALUES ( ?, ? );', [ ( service_id, serverside_message_id ) for serverside_message_id in serverside_message_ids ] )

        # statuses

        message_keys_dict = {}
        statuses_dict = {}

        inserts = []

        for ( message_key, contact_key, status ) in statuses:

            if message_key in message_keys_dict: message_id = message_keys_dict[ message_key ]
            else:

                message_id = self._GetMessageId( message_key )

                message_keys_dict[ message_key ] = message_id


            if status in statuses_dict: status_id = statuses_dict[ status ]
            else:

                status_id = self._GetStatusId( status )

                statuses_dict[ status ] = status_id


            inserts.append( ( message_id, sqlite3.Binary( contact_key ), status_id ) )


        # replace is important here
        self._c.executemany( 'INSERT OR REPLACE INTO incoming_message_statuses ( message_id, contact_key, status_id ) VALUES ( ?, ?, ? );', inserts )

        # finally:

        self._c.execute( 'UPDATE message_depots SET last_check = ? WHERE service_id = ?;', ( new_last_check, service_id ) )


    def _ArchiveConversation( self, conversation_key ):

        conversation_id = self._GetMessageId( conversation_key )

        message_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM messages WHERE conversation_id = ?;', ( conversation_id, ) ) ]

        self._c.execute( 'DELETE FROM message_inbox WHERE message_id IN ' + HydrusData.SplayListForDB( message_ids ) + ';' )

        self.pub_after_commit( 'archive_conversation_data', conversation_key )
        self.pub_after_commit( 'archive_conversation_gui', conversation_key )

        self._DoStatusNumInbox()


    def _AssociateContact( self, service_key ):

        service_id = self._GetServiceId( service_key )

        service = self._GetService( service_id )

        private_key = service.GetPrivateKey()

        public_key = HydrusEncryption.GetPublicKey( private_key )

        contact_key = hashlib.sha256( public_key ).digest()

        contact_id = self._GetContactId( service_id )

        self._c.execute( 'UPDATE contacts SET contact_key = ?, public_key = ? WHERE contact_id = ?;', ( sqlite3.Binary( contact_key ), public_key, contact_id ) )


    def _DeleteConversation( self, conversation_key ):

        conversation_id = self._GetMessageId( conversation_key )

        message_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM messages WHERE conversation_id = ?;', ( conversation_id, ) ) ]

        splayed_message_ids = HydrusData.SplayListForDB( message_ids )

        self._c.execute( 'DELETE FROM message_keys WHERE message_id IN ' + splayed_message_ids + ';' )
        self._c.execute( 'DELETE FROM message_bodies WHERE docid IN ' + splayed_message_ids + ';' )
        self._c.execute( 'DELETE FROM conversation_subjects WHERE docid IN ' + splayed_message_ids + ';' )

        self.pub_after_commit( 'delete_conversation_data', conversation_key )
        self.pub_after_commit( 'delete_conversation_gui', conversation_key )

        self._DoStatusNumInbox()


    def _DeleteDraft( self, draft_key ):

        message_id = self._GetMessageId( draft_key )

        self._c.execute( 'DELETE FROM message_keys WHERE message_id = ?;', ( message_id, ) )
        self._c.execute( 'DELETE FROM message_bodies WHERE docid = ?;', ( message_id, ) )
        self._c.execute( 'DELETE FROM conversation_subjects WHERE docid = ?;', ( message_id, ) )

        self.pub_after_commit( 'delete_draft_data', draft_key )
        self.pub_after_commit( 'delete_draft_gui', draft_key )
        self.pub_after_commit( 'notify_check_messages' )


    def _DoMessageQuery( self, query_key, search_context ):

        identity = search_context.GetIdentity()

        name = identity.GetName()

        contact_id = self._GetContactId( identity )

        system_predicates = search_context.GetSystemPredicates()

        ( inbox, archive, draft, status, contact_from, contact_to, contact_started, min_timestamp, max_timestamp ) = system_predicates.GetInfo()

        if draft:

            draft_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM messages, message_drafts USING ( message_id ) WHERE contact_id_from = ?;', ( contact_id, ) ) ]

            query_message_ids = draft_ids

        else:

            sql_predicates = [ '( contact_id_from = ' + str( contact_id ) + ' OR contact_id_to = ' + str( contact_id ) + ' )' ]

            if name != 'Anonymous':

                service = self._GetService( identity )

                if not service.ReceivesAnon(): sql_predicates.append( 'contact_id_from != 1' )


            if status is not None:

                if status == 'unread': status = 'sent'

                status_id = self._GetStatusId( status )

                sql_predicates.append( '( contact_id_to = ' + str( contact_id ) + ' AND status_id = ' + str( status_id ) + ')' )


            if contact_from is not None:

                contact_id_from = self._GetContactId( contact_from )

                sql_predicates.append( 'contact_id_from = ' + str( contact_id_from ) )


            if contact_to is not None:

                contact_id_to = self._GetContactId( contact_to )

                sql_predicates.append( 'contact_id_to = ' + str( contact_id_to ) )


            if contact_started is not None:

                contact_id_started = self._GetContactId( contact_started )

                sql_predicates.append( 'conversation_id = message_id AND contact_id_from = ' + str( contact_id_started ) )


            if min_timestamp is not None: sql_predicates.append( 'timestamp >= ' + str( min_timestamp ) )
            if max_timestamp is not None: sql_predicates.append( 'timestamp <= ' + str( max_timestamp ) )

            query_message_ids = { message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM messages, message_destination_map USING ( message_id ) WHERE ' + ' AND '.join( sql_predicates ) + ';' ) }

            if inbox or archive:

                inbox_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM message_inbox, message_destination_map USING ( message_id ) WHERE contact_id_to = ?;', ( contact_id, ) ) ]

                if inbox: query_message_ids.intersection_update( inbox_ids )
                elif archive: query_message_ids.difference_update( inbox_ids )


        for term in search_context.GetTermsToInclude():

            body_query_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT docid FROM message_bodies WHERE body MATCH ?;', ( term, ) ) ]
            subject_query_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT docid FROM conversation_subjects WHERE subject MATCH ?;', ( term, ) ) ]

            query_message_ids.intersection_update( body_query_ids + subject_query_ids )


        for term in search_context.GetTermsToExclude():

            body_query_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT docid FROM message_bodies WHERE body MATCH ?;', ( term, ) ) ]
            subject_query_ids = [ message_id for ( message_id, ) in self._c.execute( 'SELECT docid FROM conversation_subjects WHERE subject MATCH ?;', ( term, ) ) ]

            query_message_ids.difference_update( body_query_ids + subject_query_ids )


        conversations = self._GetConversations( search_context, query_message_ids )

        self.pub_after_commit( 'message_query_done', query_key, conversations )


    def _DoStatusNumInbox( self ):

        convo_ids = { id for ( id, ) in self._c.execute( 'SELECT conversation_id FROM messages, message_inbox USING ( message_id );' ) }

        num_inbox = len( convo_ids )

        if num_inbox == 0: inbox_string = 'message inbox empty'
        else: inbox_string = str( num_inbox ) + ' in message inbox'

        self.pub_after_commit( 'inbox_status', inbox_string )


    def _DraftMessage( self, draft_message ):

        ( draft_key, conversation_key, subject, contact_from, contact_names_to, recipients_visible, body, attachment_hashes ) = draft_message.GetInfo()

        old_message_id = self._GetMessageId( draft_key )

        self._c.execute( 'DELETE FROM message_keys WHERE message_id = ?;', ( old_message_id, ) )
        self._c.execute( 'DELETE FROM message_bodies WHERE docid = ?;', ( old_message_id, ) )
        self._c.execute( 'DELETE FROM conversation_subjects WHERE docid = ?;', ( old_message_id, ) )

        message_id = self._GetMessageId( draft_key )

        conversation_id = self._GetConversationId( conversation_key, subject )

        contact_id_from = self._GetContactId( contact_from )

        self._c.execute( 'INSERT INTO messages ( conversation_id, message_id, contact_id_from, timestamp ) VALUES ( ?, ?, ?, ? );', ( conversation_id, message_id, contact_id_from, None ) )

        self._c.execute( 'INSERT INTO message_bodies ( docid, body ) VALUES ( ?, ? );', ( message_id, body ) )

        status_id = self._GetStatusId( 'draft' )

        contact_ids_to = [ self._GetContactId( contact_name_to ) for contact_name_to in contact_names_to ]

        self._c.executemany( 'INSERT INTO message_destination_map ( message_id, contact_id_to, status_id ) VALUES ( ?, ?, ? );', [ ( message_id, contact_id_to, status_id ) for contact_id_to in contact_ids_to ] )

        self._c.execute( 'INSERT INTO message_drafts ( message_id, recipients_visible ) VALUES ( ?, ? );', ( message_id, recipients_visible ) )

        hash_ids = self._GetHashIds( attachment_hashes )

        self._c.executemany( 'INSERT INTO message_attachments ( message_id, hash_id ) VALUES ( ?, ? );', [ ( message_id, hash_id ) for hash_id in hash_ids ] )

        self.pub_after_commit( 'draft_saved', draft_key, draft_message )


    def _FlushMessageStatuses( self ):

        incoming_message_statuses = HydrusData.BuildKeyToListDict( [ ( message_id, ( contact_key, status_id ) ) for ( message_id, contact_key, status_id ) in self._c.execute( 'SELECT message_id, contact_key, status_id FROM incoming_message_statuses, messages USING ( message_id );' ) ] )

        for ( message_id, status_infos ) in incoming_message_statuses.items():

            for ( contact_key, status_id ) in status_infos:

                try:

                    contact_id_to = self._GetContactId( contact_key )

                    self._c.execute( 'INSERT OR REPLACE INTO message_destination_map ( message_id, contact_id_to, status_id ) VALUES ( ?, ?, ? );', ( message_id, contact_id_to, status_id ) )

                except: pass


            self._c.execute( 'DELETE FROM incoming_message_statuses WHERE message_id = ?;', ( message_id, ) )

            message_key = self._GetMessageKey( message_id )

            status_updates = [ ( contact_key, self._GetStatus( status_id ) ) for ( contact_key, status_id ) in status_infos ]

            self.pub_after_commit( 'message_statuses_data', message_key, status_updates )
            self.pub_after_commit( 'message_statuses_gui', message_key, status_updates )


    def _GetAutocompleteContacts( self, half_complete_name, name_to_exclude = None ):

        # expand this later to do groups as well

        names = [ name for ( name, ) in self._c.execute( 'SELECT name FROM contacts WHERE name LIKE ? AND name != ? AND public_key NOTNULL;', ( half_complete_name + '%', 'Anonymous' ) ) ]

        if name_to_exclude is not None: names = [ name for name in names if name != name_to_exclude ]

        return names


    def _GetContact( self, parameter ):

        if type( parameter ) == int: ( public_key, name, host, port ) = self._c.execute( 'SELECT public_key, name, host, port FROM contacts WHERE contact_id = ?;', ( parameter, ) ).fetchone()
        elif type( parameter ) in ( str, unicode ):
            try: ( public_key, name, host, port ) = self._c.execute( 'SELECT public_key, name, host, port FROM contacts WHERE contact_key = ?;', ( sqlite3.Binary( parameter ), ) ).fetchone()
            except: ( public_key, name, host, port ) = self._c.execute( 'SELECT public_key, name, host, port FROM contacts WHERE name = ?;', ( parameter, ) ).fetchone()

        return ClientConstantsMessages.Contact( public_key, name, host, port )


    def _GetContactId( self, parameter ):

        if type( parameter ) in ( str, unicode ):

            if parameter == 'Anonymous': return 1

            try: ( contact_id, ) = self._c.execute( 'SELECT contact_id FROM contacts WHERE contact_key = ?;', ( sqlite3.Binary( parameter ), ) ).fetchone()
            except: ( contact_id, ) = self._c.execute( 'SELECT contact_id FROM contacts WHERE name = ?;', ( parameter, ) ).fetchone()

        elif type( parameter ) == int: ( contact_id, ) = self._c.execute( 'SELECT contact_id FROM contacts, message_depots USING ( contact_id ) WHERE service_id = ?;', ( parameter, ) ).fetchone()
        elif type( parameter ) == ClientConstantsMessages.Contact:

            contact_key = parameter.GetContactKey()

            name = parameter.GetName()

            if name == 'Anonymous': return 1

            if contact_key is not None:

                result = self._c.execute( 'SELECT contact_id FROM contacts WHERE contact_key = ?;', ( sqlite3.Binary( contact_key ), ) ).fetchone()

                if result is None:

                    # we have a new contact from an outside source!
                    # let's generate a name that'll fit into the db

                    while self._c.execute( 'SELECT 1 FROM contacts WHERE name = ?;', ( name, ) ).fetchone() is not None: name += str( random.randint( 0, 9 ) )


            else:

                # one of our user-entered contacts that doesn't have a public key yet

                result = self._c.execute( 'SELECT contact_id FROM contacts WHERE name = ?;', ( name, ) ).fetchone()


            if result is None:

                public_key = parameter.GetPublicKey()
                ( host, port ) = parameter.GetAddress()

                if public_key is not None: contact_key = sqlite3.Binary( contact_key )

                self._c.execute( 'INSERT INTO contacts ( contact_key, public_key, name, host, port ) VALUES ( ?, ?, ?, ?, ? );', ( contact_key, public_key, name, host, port ) )

                contact_id = self._c.lastrowid

            else: ( contact_id, ) = result


        return contact_id


    def _GetContactIdsToContacts( self, contact_ids ): return { contact_id : ClientConstantsMessages.Contact( public_key, name, host, port ) for ( contact_id, public_key, name, host, port ) in self._c.execute( 'SELECT contact_id, public_key, name, host, port FROM contacts WHERE contact_id IN ' + HydrusData.SplayListForDB( contact_ids ) + ';' ) }

    def _GetContactNames( self ): return [ name for ( name, ) in self._c.execute( 'SELECT name FROM contacts;' ) ]

    def _GetConversations( self, search_context, query_message_ids ):

        system_predicates = search_context.GetSystemPredicates()

        conversation_ids = { conversation_id for ( conversation_id, ) in self._c.execute( 'SELECT conversation_id FROM messages WHERE message_id IN ' + HydrusData.SplayListForDB( query_message_ids ) + ';' ) }

        splayed_conversation_ids = HydrusData.SplayListForDB( conversation_ids )

        conversation_infos = self._c.execute( 'SELECT message_id, message_key, subject FROM message_keys, conversation_subjects ON message_id = conversation_subjects.docid WHERE message_id IN ' + splayed_conversation_ids + ';' ).fetchall()

        conversation_ids_to_message_infos = HydrusData.BuildKeyToListDict( [ ( conversation_id, ( message_id, contact_id_from, timestamp, body ) ) for ( conversation_id, message_id, contact_id_from, timestamp, body ) in self._c.execute( 'SELECT conversation_id, message_id, contact_id_from, timestamp, body FROM messages, message_bodies ON message_id = message_bodies.docid WHERE conversation_id IN ' + splayed_conversation_ids + ' ORDER BY timestamp ASC;' ) ] )

        message_ids = []
        contact_ids = set()

        for message_infos in conversation_ids_to_message_infos.values():

            message_ids.extend( [ message_id for ( message_id, contact_id_from, timestamp, body ) in message_infos ] )
            contact_ids.update( [ contact_id_from for ( message_id, contact_id_from, timestamp, body ) in message_infos ] )


        message_ids_to_message_keys = self._GetMessageIdsToMessageKeys( message_ids )

        splayed_message_ids = HydrusData.SplayListForDB( message_ids )

        message_ids_to_destination_ids = HydrusData.BuildKeyToListDict( [ ( message_id, ( contact_id_to, status_id ) ) for ( message_id, contact_id_to, status_id ) in self._c.execute( 'SELECT message_id, contact_id_to, status_id FROM message_destination_map WHERE message_id IN ' + splayed_message_ids + ';' ) ] )

        messages_ids_to_recipients_visible = { message_id : recipients_visible for ( message_id, recipients_visible ) in self._c.execute( 'SELECT message_id, recipients_visible FROM message_drafts;' ) }

        status_ids = set()

        for destination_ids in message_ids_to_destination_ids.values():

            contact_ids.update( [ contact_id_to for ( contact_id_to, status_id ) in destination_ids ] )
            status_ids.update( [ status_id for ( contact_id_to, status_id ) in destination_ids ] )


        contact_ids_to_contacts = self._GetContactIdsToContacts( contact_ids )
        status_ids_to_statuses = self._GetStatusIdsToStatuses( status_ids )

        message_ids_to_hash_ids = HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT message_id, hash_id FROM message_attachments WHERE message_id IN ' + splayed_message_ids + ';' ).fetchall() )

        hash_ids = set()

        for sub_hash_ids in message_ids_to_hash_ids.values(): hash_ids.update( sub_hash_ids )

        hash_ids_to_hashes = self._GetHashIdsToHashes( hash_ids )

        identity = search_context.GetIdentity()

        inbox_ids = { message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM message_inbox;' ) }

        conversations = []

        for ( conversation_id, conversation_key, subject ) in conversation_infos:

            messages = []
            drafts = []

            can_add = False

            for ( message_id, contact_id_from, timestamp, body ) in conversation_ids_to_message_infos[ conversation_id ]:

                message_key = message_ids_to_message_keys[ message_id ]

                contact_from = contact_ids_to_contacts[ contact_id_from ]

                attachment_hashes = [ hash_ids_to_hashes[ hash_id ] for hash_id in message_ids_to_hash_ids[ message_id ] ]

                if system_predicates.Ok( len( attachment_hashes ) ): can_add = True

                attachment_hashes.sort()

                destination_ids = message_ids_to_destination_ids[ message_id ]

                if message_id in messages_ids_to_recipients_visible:

                    # this is a draft

                    contact_names_to = [ contact_ids_to_contacts[ contact_id_to ].GetName() for ( contact_id_to, status_id ) in destination_ids ]

                    recipients_visible = messages_ids_to_recipients_visible[ message_id ]

                    drafts.append( ClientConstantsMessages.DraftMessage( message_key, conversation_key, subject, contact_from, contact_names_to, recipients_visible, body, attachment_hashes ) )

                else:

                    inbox = message_id in inbox_ids

                    destinations = [ ( contact_ids_to_contacts[ contact_id_to ], status_ids_to_statuses[ status_id ] ) for ( contact_id_to, status_id ) in destination_ids ]

                    messages.append( ClientConstantsMessages.Message( message_key, contact_from, destinations, timestamp, body, attachment_hashes, inbox ) )


            if can_add: conversations.append( ClientConstantsMessages.Conversation( identity, conversation_key, subject, messages, drafts, search_context ) )


        return conversations


    def _GetConversationId( self, conversation_key, subject ):

        result = self._c.execute( 'SELECT message_id FROM message_keys, conversation_subjects ON message_id = conversation_subjects.docid WHERE message_key = ?;', ( sqlite3.Binary( conversation_key ), ) ).fetchone()

        if result is None:

            conversation_id = self._GetMessageId( conversation_key )

            self._c.execute( 'INSERT INTO conversation_subjects ( docid, subject ) VALUES ( ?, ? );', ( conversation_id, subject ) )

        else: ( conversation_id, ) = result

        return conversation_id


    def _GetIdentities( self ):

        my_identities = [ ClientConstantsMessages.Contact( public_key, name, host, port ) for ( public_key, name, host, port ) in self._c.execute( 'SELECT public_key, name, host, port FROM contacts, message_depots USING ( contact_id ) ORDER BY name ASC;' ) ]

        return my_identities + [ self._GetContact( 'Anonymous' ) ]


    def _GetIdentitiesAndContacts( self ):

        contacts_info = self._c.execute( 'SELECT contact_id, public_key, name, host, port FROM contacts ORDER BY name ASC;' ).fetchall()

        identity_ids = { contact_id for ( contact_id, ) in self._c.execute( 'SELECT contact_id FROM message_depots;' ) }

        identities = [ ClientConstantsMessages.Contact( public_key, name, host, port ) for ( contact_id, public_key, name, host, port ) in contacts_info if contact_id in identity_ids ]
        contacts = [ ClientConstantsMessages.Contact( public_key, name, host, port ) for ( contact_id, public_key, name, host, port ) in contacts_info if contact_id not in identity_ids and name != 'Anonymous' ]

        contact_contact_ids = [ contact_id for ( contact_id, public_key, name, host, port ) in contacts_info if contact_id not in identity_ids and name != 'Anonymous' ]

        deletable_names = { name for ( name, ) in self._c.execute( 'SELECT name FROM contacts WHERE contact_id IN ' + HydrusData.SplayListForDB( contact_contact_ids ) + ' AND NOT EXISTS ( SELECT 1 FROM message_destination_map WHERE contact_id_to = contact_id ) AND NOT EXISTS ( SELECT 1 FROM messages WHERE contact_id_from = contact_id );' ) }

        return ( identities, contacts, deletable_names )


    def _GetMessageId( self, message_key ):

        result = self._c.execute( 'SELECT message_id FROM message_keys WHERE message_key = ?;', ( sqlite3.Binary( message_key ), ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO message_keys ( message_key ) VALUES ( ? );', ( sqlite3.Binary( message_key ), ) )

            message_id = self._c.lastrowid

        else: ( message_id, ) = result

        return message_id


    def _GetMessageIds( self, message_keys ):

        message_ids = []

        if type( message_keys ) == type( set() ): message_keys = list( message_keys )

        for i in range( 0, len( message_keys ), 250 ): # there is a limit on the number of parameterised variables in sqlite, so only do a few at a time

            message_keys_subset = message_keys[ i : i + 250 ]

            message_ids.extend( [ message_id for ( message_id, ) in self._c.execute( 'SELECT message_id FROM message_keys WHERE message_key IN (' + ','.join( '?' * len( message_keys_subset ) ) + ');', [ sqlite3.Binary( message_key ) for message_key in message_keys_subset ] ) ] )


        if len( message_keys ) > len( message_ids ):

            if len( set( message_keys ) ) > len( message_ids ):

                # must be some new messages the db has not seen before, so let's generate them as appropriate

                message_ids = self._GetMessageIds( message_keys )


        return message_ids


    def _GetMessageIdsToMessages( self, message_ids ): return { message_id : message for ( message_id, message ) in self._c.execute( 'SELECT message_id, message FROM messages WHERE message_id IN ' + HydrusData.SplayListForDB( message_ids ) + ';' ) }

    def _GetMessageIdsToMessageKeys( self, message_ids ): return { message_id : message_key for ( message_id, message_key ) in self._c.execute( 'SELECT message_id, message_key FROM message_keys WHERE message_id IN ' + HydrusData.SplayListForDB( message_ids ) + ';' ) }

    def _GetMessageKey( self, message_id ):

        result = self._c.execute( 'SELECT message_key FROM message_keys WHERE message_id = ?;', ( message_id, ) ).fetchone()

        if result is None: raise Exception( 'Message key error in database' )

        ( message_key, ) = result

        return message_key


    def _GetMessageKeysToDownload( self, service_key ):

        service_id = self._GetServiceId( service_key )

        message_keys = [ message_key for ( message_key, ) in self._c.execute( 'SELECT message_key FROM message_downloads, message_keys USING ( message_id ) WHERE service_id = ?;', ( service_id, ) ) ]

        return message_keys


    def _GetMessageSystemPredicates( self, identity ):

        name = identity.GetName()

        is_anon = name == 'Anonymous'

        additional_predicate = ''

        if name != 'Anonymous':

            service = self._GetService( identity )

            if not service.ReceivesAnon(): additional_predicate = 'contact_id_from != 1 AND '


        contact_id = self._GetContactId( name )

        unread_status_id = self._GetStatusId( 'sent' )

        #service_info = self._GetServiceInfoSpecific( service_id, service_type, { HC.SERVICE_INFO_NUM_CONVERSATIONS, HC.SERVICE_INFO_NUM_INBOX, HC.SERVICE_INFO_NUM_UNREAD, HC.SERVICE_INFO_NUM_DRAFTS } )

        ( num_conversations, ) = self._c.execute( 'SELECT COUNT( DISTINCT conversation_id ) FROM messages, message_destination_map USING ( message_id ) WHERE ' + additional_predicate + '( contact_id_from = ? OR contact_id_to = ? );', ( contact_id, contact_id ) ).fetchone()
        ( num_inbox, ) = self._c.execute( 'SELECT COUNT( DISTINCT conversation_id ) FROM message_destination_map, ( messages, message_inbox USING ( message_id ) ) USING ( message_id ) WHERE ' + additional_predicate + 'contact_id_to = ?;', ( contact_id, ) ).fetchone()
        ( num_drafts, ) = self._c.execute( 'SELECT COUNT( DISTINCT conversation_id ) FROM messages, message_drafts USING ( message_id ) WHERE contact_id_from = ?;', ( contact_id, ) ).fetchone()
        ( num_unread, ) = self._c.execute( 'SELECT COUNT( DISTINCT conversation_id ) FROM messages, message_destination_map USING ( message_id ) WHERE ' + additional_predicate + 'contact_id_to = ? AND status_id = ?;', ( contact_id, unread_status_id ) ).fetchone()

        predicates = []

        # anon has no inbox, no received mail; only sent mail

        predicates.append( ( u'system:everything', num_conversations ) )
        if not is_anon:
            predicates.append( ( u'system:inbox', num_inbox ) )
            predicates.append( ( u'system:archive', num_conversations - num_inbox ) )
            predicates.append( ( u'system:unread', num_unread ) )
        predicates.append( ( u'system:drafts', num_drafts ) )
        if not is_anon:
            predicates.append( ( u'system:started_by', None ) )
            predicates.append( ( u'system:from', None ) )
        predicates.append( ( u'system:to', None ) )
        predicates.append( ( u'system:age', None ) )
        predicates.append( ( u'system:numattachments', None ) )
        # we can add more later

        return predicates


    def _GetMessagesToSend( self ):

        status_id = self._GetStatusId( 'pending' )

        message_id_to_contact_ids = HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT message_id, contact_id_to FROM message_destination_map WHERE status_id = ?;', ( status_id, ) ) )

        messages_to_send = [ ( self._GetMessageKey( message_id ), [ self._GetContact( contact_id_to ) for contact_id_to in contact_ids_to ] ) for ( message_id, contact_ids_to ) in message_id_to_contact_ids.items() ]

        return messages_to_send


    def _GetStatus( self, status_id ):

        result = self._c.execute( 'SELECT status FROM statuses WHERE status_id = ?;', ( status_id, ) ).fetchone()

        if result is None: raise Exception( 'Status error in database' )

        ( status, ) = result

        return status


    def _GetStatusId( self, status ):

        result = self._c.execute( 'SELECT status_id FROM statuses WHERE status = ?;', ( status, ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO statuses ( status ) VALUES ( ? );', ( status, ) )

            status_id = self._c.lastrowid

        else: ( status_id, ) = result

        return status_id


    def _GetStatusIdsToStatuses( self, status_ids ): return { status_id : status for ( status_id, status ) in self._c.execute( 'SELECT status_id, status FROM statuses WHERE status_id IN ' + HydrusData.SplayListForDB( status_ids ) + ';' ) }

    def _GetTransportMessage( self, message_key ):

        message_id = self._GetMessageId( message_key )

        ( conversation_id, contact_id_from, timestamp ) = self._c.execute( 'SELECT conversation_id, contact_id_from, timestamp FROM messages WHERE message_id = ?;', ( message_id, ) ).fetchone()

        contact_ids_to = [ contact_id_to for ( contact_id_to, ) in self._c.execute( 'SELECT contact_id_to FROM message_destination_map WHERE message_id = ?;', ( message_id, ) ) ]

        ( subject, ) = self._c.execute( 'SELECT subject FROM conversation_subjects WHERE docid = ?;', ( conversation_id, ) ).fetchone()

        ( body, ) = self._c.execute( 'SELECT body FROM message_bodies WHERE docid = ?;', ( message_id, ) ).fetchone()

        attachment_hashes = [ hash for ( hash, ) in self._c.execute( 'SELECT hash FROM message_attachments, hashes USING ( hash_id ) WHERE message_id = ?;', ( message_id, ) ) ]

        attachment_hashes.sort()

        files = []

        client_files_manager = self._controller.GetClientFilesManager()

        for hash in attachment_hashes:

            path = client_files_manager.GetFilePath( hash )

            with open( path, 'rb' ) as f: file = f.read()

            files.append( file )


        conversation_key = self._GetMessageKey( conversation_id )

        contact_from = self._GetContact( contact_id_from )

        contacts_to = [ self._GetContact( contact_id_to ) for contact_id_to in contact_ids_to ]

        if contact_from.GetName() == 'Anonymous':

            contact_from = None
            message_depot = None
            private_key = None

        else:

            message_depot = self._GetService( contact_from )
            private_key = message_depot.GetPrivateKey()


        if conversation_key == message_key: conversation_key = None

        message = HydrusMessageHandling.Message( conversation_key, contact_from, contacts_to, subject, body, timestamp, files = files, private_key = private_key )

        return message


    def _GetTransportMessagesFromDraft( self, draft_message ):

        ( draft_key, conversation_key, subject, contact_from, contact_names_to, recipients_visible, body, attachment_hashes ) = draft_message.GetInfo()

        ( xml, html ) = yaml.safe_load( body )

        body = html

        files = []

        client_files_manager = self._controller.GetClientFilesManager()

        for hash in attachment_hashes:

            path = client_files_manager.GetFilePath( hash )

            with open( path, 'rb' ) as f: file = f.read()

            files.append( file )


        contact_id_from = self._GetContactId( contact_from )

        if contact_from.GetName() == 'Anonymous':

            contact_from = None
            message_depot = None
            private_key = None

        else:

            message_depot = self._GetService( contact_from )
            private_key = message_depot.GetPrivateKey()


        timestamp = HydrusData.GetNow()

        contacts_to = [ self._GetContact( contact_name_to ) for contact_name_to in contact_names_to ]

        if conversation_key == draft_key: conversation_key = None

        if recipients_visible: messages = [ HydrusMessageHandling.Message( conversation_key, contact_from, contacts_to, subject, body, timestamp, files = files, private_key = private_key ) ]
        else: messages = [ HydrusMessageHandling.Message( conversation_key, contact_from, [ contact_to ], subject, body, timestamp, files = files, private_key = private_key ) for contact_to in contacts_to ]

        return messages


    def _InboxConversation( self, conversation_key ):

        conversation_id = self._GetMessageId( conversation_key )

        inserts = self._c.execute( 'SELECT message_id FROM messages WHERE conversation_id = ?;', ( conversation_id, ) ).fetchall()

        self._c.executemany( 'INSERT OR IGNORE INTO message_inbox ( message_id ) VALUES ( ? );', inserts )

        self.pub_after_commit( 'inbox_conversation_data', conversation_key )
        self.pub_after_commit( 'inbox_conversation_gui', conversation_key )

        self._DoStatusNumInbox()


    def _UpdateContacts( self, edit_log ):

        for ( action, details ) in edit_log:

            if action == HC.ADD:

                contact = details

                self._AddContact( contact )

            elif action == HC.DELETE:

                name = details

                result = self._c.execute( 'SELECT 1 FROM contacts WHERE name = ? AND NOT EXISTS ( SELECT 1 FROM message_destination_map WHERE contact_id_to = contact_id ) AND NOT EXISTS ( SELECT 1 FROM messages WHERE contact_id_from = contact_id );', ( name, ) ).fetchone()

                if result is not None: self._c.execute( 'DELETE FROM contacts WHERE name = ?;', ( name, ) )

            elif action == HC.EDIT:

                ( old_name, contact ) = details

                try:

                    contact_id = self._GetContactId( old_name )

                    ( public_key, name, host, port ) = contact.GetInfo()

                    contact_key = contact.GetContactKey()

                    if public_key is not None: contact_key = sqlite3.Binary( contact_key )

                    self._c.execute( 'UPDATE contacts SET contact_key = ?, public_key = ?, name = ?, host = ?, port = ? WHERE contact_id = ?;', ( contact_key, public_key, name, host, port, contact_id ) )

                except: pass


        self.pub_after_commit( 'notify_new_contacts' )


    def _UpdateMessageStatuses( self, message_key, status_updates ):

        message_id = self._GetMessageId( message_key )

        updates = []

        for ( contact_key, status ) in status_updates:

            contact_id = self._GetContactId( contact_key )
            status_id = self._GetStatusId( status )

            updates.append( ( contact_id, status_id ) )


        self._c.executemany( 'UPDATE message_destination_map SET status_id = ? WHERE contact_id_to = ? AND message_id = ?;', [ ( status_id, contact_id, message_id ) for ( contact_id, status_id ) in updates ] )

        self.pub_after_commit( 'message_statuses_data', message_key, status_updates )
        self.pub_after_commit( 'message_statuses_gui', message_key, status_updates )
        self.pub_after_commit( 'notify_check_messages' )

    '''

def GenerateCombinedFilesMappingsCacheTableName( service_id ):

    return 'external_caches.combined_files_ac_cache_' + str( service_id )

def GenerateMappingsTableNames( service_id ):

    suffix = str( service_id )

    current_mappings_table_name = 'external_mappings.current_mappings_' + suffix

    deleted_mappings_table_name = 'external_mappings.deleted_mappings_' + suffix

    pending_mappings_table_name = 'external_mappings.pending_mappings_' + suffix

    petitioned_mappings_table_name = 'external_mappings.petitioned_mappings_' + suffix

    return ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name )

def GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id ):

    suffix = str( file_service_id ) + '_' + str( tag_service_id )

    cache_files_table_name = 'external_caches.specific_files_cache_' + suffix

    cache_current_mappings_table_name = 'external_caches.specific_current_mappings_cache_' + suffix

    cache_pending_mappings_table_name = 'external_caches.specific_pending_mappings_cache_' + suffix

    ac_cache_table_name = 'external_caches.specific_ac_cache_' + suffix

    return ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name )

class DB( HydrusDB.HydrusDB ):

    READ_WRITE_ACTIONS = [ 'service_info', 'system_predicates' ]

    def __init__( self, controller, db_dir, db_name, no_wal = False ):

        self._updates_dir = os.path.join( db_dir, 'client_updates' )

        self._initial_messages = []

        HydrusDB.HydrusDB.__init__( self, controller, db_dir, db_name, no_wal = no_wal )


    def _AddFilesInfo( self, rows, overwrite = False ):

        if overwrite:

            insert_phrase = 'REPLACE INTO'

        else:

            insert_phrase = 'INSERT OR IGNORE INTO'


        # hash_id, size, mime, width, height, duration, num_frames, num_words
        self._c.executemany( insert_phrase + ' files_info VALUES ( ?, ?, ?, ?, ?, ?, ?, ? );', rows )


    def _AddFiles( self, service_id, rows ):

        hash_ids = { row[0] for row in rows }

        existing_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( service_id, ) ) }

        valid_hash_ids = hash_ids.difference( existing_hash_ids )

        if len( valid_hash_ids ) > 0:

            valid_rows = [ ( hash_id, timestamp ) for ( hash_id, timestamp ) in rows if hash_id in valid_hash_ids ]

            splayed_valid_hash_ids = HydrusData.SplayListForDB( valid_hash_ids )

            # insert the files

            self._c.executemany( 'INSERT OR IGNORE INTO current_files VALUES ( ?, ?, ? );', ( ( service_id, hash_id, timestamp ) for ( hash_id, timestamp ) in valid_rows ) )

            self._c.execute( 'DELETE FROM file_transfers WHERE service_id = ? AND hash_id IN ' + splayed_valid_hash_ids + ';', ( service_id, ) )

            info = self._c.execute( 'SELECT hash_id, size, mime FROM files_info WHERE hash_id IN ' + splayed_valid_hash_ids + ';' ).fetchall()

            num_files = len( valid_hash_ids )
            delta_size = sum( ( size for ( hash_id, size, mime ) in info ) )
            num_inbox = len( valid_hash_ids.intersection( self._inbox_hash_ids ) )

            service_info_updates = []

            service_info_updates.append( ( delta_size, service_id, HC.SERVICE_INFO_TOTAL_SIZE ) )
            service_info_updates.append( ( num_files, service_id, HC.SERVICE_INFO_NUM_FILES ) )
            service_info_updates.append( ( num_inbox, service_id, HC.SERVICE_INFO_NUM_INBOX ) )

            # now do special stuff

            service = self._GetService( service_id )

            service_type = service.GetServiceType()

            # remove any records of previous deletion

            if service_id == self._combined_local_file_service_id or service_type == HC.FILE_REPOSITORY:

                self._c.execute( 'DELETE FROM deleted_files WHERE service_id = ? AND hash_id IN ' + splayed_valid_hash_ids + ';', ( service_id, ) )

                num_deleted = self._GetRowCount()

                service_info_updates.append( ( -num_deleted, service_id, HC.SERVICE_INFO_NUM_DELETED_FILES ) )


            # if we are adding to a local file domain, remove any from the trash and add to combined local file service if needed

            if service_type == HC.LOCAL_FILE_DOMAIN:

                self._DeleteFiles( self._trash_service_id, valid_hash_ids )

                self._AddFiles( self._combined_local_file_service_id, valid_rows )


            # if we track tags for this service, update the a/c cache

            if service_type in HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES:

                tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

                for tag_service_id in tag_service_ids:

                    self._CacheSpecificMappingsAddFiles( service_id, tag_service_id, valid_hash_ids )


            # push the service updates, done

            self._c.executemany( 'UPDATE service_info SET info = info + ? WHERE service_id = ? AND info_type = ?;', service_info_updates )


    def _AddHydrusSession( self, service_key, session_key, expires ):

        service_id = self._GetServiceId( service_key )

        self._c.execute( 'REPLACE INTO hydrus_sessions ( service_id, session_key, expiry ) VALUES ( ?, ?, ? );', ( service_id, sqlite3.Binary( session_key ), expires ) )


    def _AddService( self, service_key, service_type, name, info ):

        if service_type == HC.LOCAL_BOORU:

            current_time_struct = time.gmtime()

            ( current_year, current_month ) = ( current_time_struct.tm_year, current_time_struct.tm_mon )

            if 'used_monthly_data' not in info: info[ 'used_monthly_data' ] = 0
            if 'max_monthly_data' not in info: info[ 'max_monthly_data' ] = None
            if 'used_monthly_requests' not in info: info[ 'used_monthly_requests' ] = 0
            if 'current_data_month' not in info: info[ 'current_data_month' ] = ( current_year, current_month )
            if 'port' not in info: info[ 'port' ] = None
            if 'upnp' not in info: info[ 'upnp' ] = None


        if service_type in HC.REMOTE_SERVICES:

            if 'last_error' not in info: info[ 'last_error' ] = 0


        if service_type in HC.RESTRICTED_SERVICES:

            if 'account' not in info:

                account = HydrusData.GetUnknownAccount()

                account.MakeStale()

                info[ 'account' ] = account

                self.pub_after_commit( 'permissions_are_stale' )


        if service_type in HC.TAG_SERVICES:

            if 'tag_archive_sync' not in info: info[ 'tag_archive_sync' ] = {}


        if service_type in HC.REPOSITORIES:

            update_dir = ClientFiles.GetExpectedUpdateDir( service_key )

            HydrusPaths.MakeSureDirectoryExists( update_dir )

            if 'first_timestamp' not in info:

                info[ 'first_timestamp' ] = None


            if 'next_download_timestamp' not in info:

                info[ 'next_download_timestamp' ] = 0


            if 'next_processing_timestamp' not in info:

                info[ 'next_processing_timestamp' ] = 0


            info[ 'paused' ] = False


        result = self._c.execute( 'SELECT 1 FROM services WHERE name = ?;', ( name, ) ).fetchone()

        while result is not None:

            name += str( random.randint( 0, 9 ) )

            result = self._c.execute( 'SELECT 1 FROM services WHERE name = ?;', ( name, ) ).fetchone()


        self._c.execute( 'INSERT INTO services ( service_key, service_type, name, info ) VALUES ( ?, ?, ?, ? );', ( sqlite3.Binary( service_key ), service_type, name, info ) )

        service_id = self._c.lastrowid

        if service_type in HC.TAG_SERVICES:

            ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

            current_mappings_table_simple_name = current_mappings_table_name.split( '.' )[1]
            deleted_mappings_table_simple_name = deleted_mappings_table_name.split( '.' )[1]
            pending_mappings_table_simple_name = pending_mappings_table_name.split( '.' )[1]
            petitioned_mappings_table_simple_name = petitioned_mappings_table_name.split( '.' )[1]

            self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + current_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + current_mappings_table_name + '_tag_id_index ON ' + current_mappings_table_simple_name + ' ( tag_id );' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + current_mappings_table_name + '_hash_id_index ON ' + current_mappings_table_simple_name + ' ( hash_id );' )

            self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + deleted_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + deleted_mappings_table_name + '_hash_id_index ON ' + deleted_mappings_table_simple_name + ' ( hash_id );' )

            self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + pending_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + pending_mappings_table_name + '_tag_id_index ON ' + pending_mappings_table_simple_name + ' ( tag_id );' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + pending_mappings_table_name + '_hash_id_index ON ' + pending_mappings_table_simple_name + ' ( hash_id );' )

            self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + petitioned_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, reason_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id, reason_id ) ) WITHOUT ROWID;' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + petitioned_mappings_table_name + '_hash_id_index ON ' + petitioned_mappings_table_simple_name + ' ( hash_id );' )

            #

            self._CacheCombinedFilesMappingsGenerate( service_id )

            file_service_ids = self._GetServiceIds( HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES )

            for file_service_id in file_service_ids:

                self._CacheSpecificMappingsGenerate( file_service_id, service_id )


        if service_type in HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES:

            tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

            for tag_service_id in tag_service_ids:

                self._CacheSpecificMappingsGenerate( service_id, tag_service_id )


    def _AddWebSession( self, name, cookies, expires ):

        self._c.execute( 'REPLACE INTO web_sessions ( name, cookies, expiry ) VALUES ( ?, ?, ? );', ( name, cookies, expires ) )


    def _AnalyzeStaleBigTables( self, stop_time = None, only_when_idle = False, force_reanalyze = False ):

        names_to_analyze = self._GetBigTableNamesToAnalyze( force_reanalyze = force_reanalyze )

        if len( names_to_analyze ) > 0:

            job_key = ClientThreading.JobKey()

            job_key.SetVariable( 'popup_title', 'database maintenance - analyzing' )

            self._controller.pub( 'message', job_key )

            random.shuffle( names_to_analyze )

            for name in names_to_analyze:

                self._controller.pub( 'splash_set_status_text', 'analyzing ' + name )
                job_key.SetVariable( 'popup_text_1', 'analyzing ' + name )

                started = HydrusData.GetNowPrecise()

                self._AnalyzeTable( name )

                time_took = HydrusData.GetNowPrecise() - started

                if time_took > 1:

                    HydrusData.Print( 'Analyzed ' + name + ' in ' + HydrusData.ConvertTimeDeltaToPrettyString( time_took ) )


                p1 = stop_time is not None and HydrusData.TimeHasPassed( stop_time )
                p2 = only_when_idle and not self._controller.CurrentlyIdle()

                if p1 or p2:

                    break


            self._c.execute( 'ANALYZE sqlite_master;' ) # this reloads the current stats into the query planner

            job_key.SetVariable( 'popup_text_1', 'done!' )

            HydrusData.Print( job_key.ToString() )

            job_key.Delete( 30 )


    def _AnalyzeTable( self, name ):

        self._c.execute( 'ANALYZE ' + name + ';' )

        ( num_rows, ) = self._c.execute( 'SELECT COUNT( * ) FROM ' + name + ';' ).fetchone()

        self._c.execute( 'DELETE FROM analyze_timestamps WHERE name = ?;', ( name, ) )

        self._c.execute( 'INSERT OR IGNORE INTO analyze_timestamps ( name, num_rows, timestamp ) VALUES ( ?, ?, ? );', ( name, num_rows, HydrusData.GetNow() ) )


    def _ArchiveFiles( self, hash_ids ):

        valid_hash_ids = [ hash_id for hash_id in hash_ids if hash_id in self._inbox_hash_ids ]

        if len( valid_hash_ids ) > 0:

            splayed_hash_ids = HydrusData.SplayListForDB( valid_hash_ids )

            self._c.execute( 'DELETE FROM file_inbox WHERE hash_id IN ' + splayed_hash_ids + ';' )

            updates = self._c.execute( 'SELECT service_id, COUNT( * ) FROM current_files WHERE hash_id IN ' + splayed_hash_ids + ' GROUP BY service_id;' ).fetchall()

            self._c.executemany( 'UPDATE service_info SET info = info - ? WHERE service_id = ? AND info_type = ?;', [ ( count, service_id, HC.SERVICE_INFO_NUM_INBOX ) for ( service_id, count ) in updates ] )

            self._inbox_hash_ids.difference_update( valid_hash_ids )


    def _Backup( self, path ):

        client_files_locations = self._GetClientFilesLocations()

        client_files_default = os.path.join( self._db_dir, 'client_files' )

        for location in client_files_locations.values():

            if not location.startswith( client_files_default ):

                HydrusData.ShowText( 'Some of your files are stored outside of ' + client_files_default + '. These files will not be backed up--please do this manually, yourself.' )

                break


        job_key = ClientThreading.JobKey( cancellable = True )

        job_key.SetVariable( 'popup_title', 'backing up db' )

        self._controller.pub( 'message', job_key )

        job_key.SetVariable( 'popup_text_1', 'closing db' )

        self._c.execute( 'COMMIT;' )

        self._CloseDBCursor()

        try:

            HydrusPaths.MakeSureDirectoryExists( path )

            for filename in self._db_filenames.values():

                job_key.SetVariable( 'popup_text_1', 'copying ' + filename )

                source = os.path.join( self._db_dir, filename )
                dest = os.path.join( path, filename )

                HydrusPaths.MirrorFile( source, dest )


            job_key.SetVariable( 'popup_text_1', 'copying files directory' )

            if os.path.exists( client_files_default ):

                HydrusPaths.MirrorTree( client_files_default, os.path.join( path, 'client_files' ) )


            job_key.SetVariable( 'popup_text_1', 'copying updates directory' )

            HydrusPaths.MirrorTree( self._updates_dir, os.path.join( path, 'client_updates' ) )

        finally:

            self._InitDBCursor()

            self._c.execute( 'BEGIN IMMEDIATE;' )


        job_key.SetVariable( 'popup_text_1', 'done!' )

        job_key.Finish()


    def _CacheCombinedFilesMappingsDrop( self, service_id ):

        ac_cache_table_name = GenerateCombinedFilesMappingsCacheTableName( service_id )

        self._c.execute( 'DROP TABLE IF EXISTS ' + ac_cache_table_name + ';' )


    def _CacheCombinedFilesMappingsGenerate( self, service_id ):

        ac_cache_table_name = GenerateCombinedFilesMappingsCacheTableName( service_id )

        self._c.execute( 'CREATE TABLE ' + ac_cache_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, current_count INTEGER, pending_count INTEGER, PRIMARY KEY( namespace_id, tag_id ) ) WITHOUT ROWID;' )

        #

        ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

        current_mappings_exist = self._c.execute( 'SELECT 1 FROM ' + current_mappings_table_name + ' LIMIT 1;' ).fetchone() is not None
        pending_mappings_exist = self._c.execute( 'SELECT 1 FROM ' + pending_mappings_table_name + ' LIMIT 1;' ).fetchone() is not None

        if current_mappings_exist or pending_mappings_exist:

            all_known_ids = self._c.execute( 'SELECT namespace_id, tag_id FROM existing_tags;' ).fetchall()

            for group_of_ids in HydrusData.SplitListIntoChunks( all_known_ids, 10000 ):

                current_counter = collections.Counter()

                if current_mappings_exist:

                    for ( namespace_id, tag_id ) in group_of_ids:

                        result = self._c.execute( 'SELECT COUNT( * ) FROM ' + current_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ?;', ( namespace_id, tag_id ) ).fetchone()

                        if result is not None:

                            ( count, ) = result

                            if count > 0:

                                current_counter[ ( namespace_id, tag_id ) ] = count


                #

                pending_counter = collections.Counter()

                if pending_mappings_exist:

                    for ( namespace_id, tag_id ) in group_of_ids:

                        result = self._c.execute( 'SELECT COUNT( * ) FROM ' + pending_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ?;', ( namespace_id, tag_id ) ).fetchone()

                        if result is not None:

                            ( count, ) = result

                            if count > 0:

                                pending_counter[ ( namespace_id, tag_id ) ] = count


                all_ids_seen = set( current_counter.keys() )
                all_ids_seen.update( pending_counter.keys() )

                count_ids = [ ( namespace_id, tag_id, current_counter[ ( namespace_id, tag_id ) ], pending_counter[ ( namespace_id, tag_id ) ] ) for ( namespace_id, tag_id ) in all_ids_seen ]

                if len( count_ids ) > 0:

                    self._CacheCombinedFilesMappingsUpdate( service_id, count_ids )


    def _CacheCombinedFilesMappingsGetAutocompleteCounts( self, service_id, namespace_ids_to_tag_ids ):

        ac_cache_table_name = GenerateCombinedFilesMappingsCacheTableName( service_id )

        results = []

        for ( namespace_id, tag_ids ) in namespace_ids_to_tag_ids.items():

            results.extend( ( ( namespace_id, tag_id, current_count, pending_count ) for ( tag_id, current_count, pending_count ) in self._c.execute( 'SELECT tag_id, current_count, pending_count FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id IN ' + HydrusData.SplayListForDB( tag_ids ) + ';', ( namespace_id, ) ) ) )


        return results


    def _CacheCombinedFilesMappingsUpdate( self, service_id, count_ids ):

        ac_cache_table_name = GenerateCombinedFilesMappingsCacheTableName( service_id )

        self._c.executemany( 'INSERT OR IGNORE INTO ' + ac_cache_table_name + ' ( namespace_id, tag_id, current_count, pending_count ) VALUES ( ?, ?, ?, ? );', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, current_delta, pending_delta ) in count_ids ) )

        self._c.executemany( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count + ?, pending_count = pending_count + ? WHERE namespace_id = ? AND tag_id = ?;', ( ( current_delta, pending_delta, namespace_id, tag_id ) for ( namespace_id, tag_id, current_delta, pending_delta ) in count_ids ) )

        self._c.executemany( 'DELETE FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND current_count = ? AND pending_count = ?;', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, current_delta, pending_delta ) in count_ids ) )


    def _CacheSimilarFilesAddLeaf( self, phash_id, phash ):

        result = self._c.execute( 'SELECT phash_id FROM shape_vptree WHERE parent_id IS NULL;' ).fetchone()

        if result is None:

            parent_id = None

        else:

            ( root_node_phash_id, ) = result

            ancestors_we_are_inside = []
            ancestors_we_are_outside = []

            an_ancestor_is_unbalanced = False

            next_ancestor_id = root_node_phash_id

            while next_ancestor_id is not None:

                ancestor_id = next_ancestor_id

                ( ancestor_phash, ancestor_radius, ancestor_inner_id, ancestor_inner_population, ancestor_outer_id, ancestor_outer_population ) = self._c.execute( 'SELECT phash, radius, inner_id, inner_population, outer_id, outer_population FROM shape_perceptual_hashes, shape_vptree USING ( phash_id ) WHERE phash_id = ?;', ( ancestor_id, ) ).fetchone()

                distance_to_ancestor = HydrusData.GetHammingDistance( phash, ancestor_phash )

                if ancestor_radius is None or distance_to_ancestor <= ancestor_radius:

                    ancestors_we_are_inside.append( ancestor_id )
                    ancestor_inner_population += 1
                    next_ancestor_id = ancestor_inner_id

                    if ancestor_inner_id is None:

                        self._c.execute( 'UPDATE shape_vptree SET inner_id = ?, radius = ? WHERE phash_id = ?;', ( phash_id, distance_to_ancestor, ancestor_id ) )

                        parent_id = ancestor_id


                else:

                    ancestors_we_are_outside.append( ancestor_id )
                    ancestor_outer_population += 1
                    next_ancestor_id = ancestor_outer_id

                    if ancestor_outer_id is None:

                        self._c.execute( 'UPDATE shape_vptree SET outer_id = ? WHERE phash_id = ?;', ( phash_id, ancestor_id ) )

                        parent_id = ancestor_id


                if not an_ancestor_is_unbalanced and ancestor_inner_population + ancestor_outer_population > 16:

                    larger = float( max( ancestor_inner_population, ancestor_outer_population ) )
                    smaller = float( min( ancestor_inner_population, ancestor_outer_population ) )

                    if smaller / larger < 0.5:

                        self._c.execute( 'INSERT OR IGNORE INTO shape_maintenance_branch_regen ( phash_id ) VALUES ( ? );', ( ancestor_id, ) )

                        # we only do this for the eldest ancestor, as the eventual rebalancing will affect all children

                        an_ancestor_is_unbalanced = True


            self._c.executemany( 'UPDATE shape_vptree SET inner_population = inner_population + 1 WHERE phash_id = ?;', ( ( ancestor_id, ) for ancestor_id in ancestors_we_are_inside ) )
            self._c.executemany( 'UPDATE shape_vptree SET outer_population = outer_population + 1 WHERE phash_id = ?;', ( ( ancestor_id, ) for ancestor_id in ancestors_we_are_outside ) )


        radius = None
        inner_id = None
        inner_population = 0
        outer_id = None
        outer_population = 0

        self._c.execute( 'INSERT INTO shape_vptree ( phash_id, parent_id, radius, inner_id, inner_population, outer_id, outer_population ) VALUES ( ?, ?, ?, ?, ?, ?, ? );', ( phash_id, parent_id, radius, inner_id, inner_population, outer_id, outer_population ) )


    def _CacheSimilarFilesDelete( self, hash_id, phash_ids = None ):

        if phash_ids is None:

            phash_ids = { phash_id for ( phash_id, ) in self._c.execute( 'SELECT phash_id FROM shape_perceptual_hash_map WHERE hash_id = ?;', ( hash_id, ) ) }

            self._c.execute( 'DELETE FROM shape_perceptual_hash_map WHERE hash_id = ?;', ( hash_id, ) )

        else:

            phash_ids = set( phash_ids )

            self._c.executemany( 'DELETE FROM shape_perceptual_hash_map WHERE phash_id = ? AND hash_id = ?;', ( ( phash_id, hash_id ) for phash_id in phash_ids ) )


        useful_phash_ids = { phash for ( phash, ) in self._c.execute( 'SELECT phash_id FROM shape_perceptual_hash_map WHERE phash_id IN ' + HydrusData.SplayListForDB( phash_ids ) + ';' ) }

        deletee_phash_ids = phash_ids.difference( useful_phash_ids )

        self._c.executemany( 'INSERT OR IGNORE INTO shape_maintenance_branch_regen ( phash_id ) VALUES ( ? );', ( ( phash_id, ) for phash_id in deletee_phash_ids ) )

        self._c.execute( 'DELETE FROM shape_search_cache WHERE hash_id = ?;', ( hash_id, ) )
        self._c.execute( 'DELETE FROM duplicate_pairs WHERE smaller_hash_id = ? or larger_hash_id = ?;', ( hash_id, hash_id ) )


    def _CacheSimilarFilesGenerateBranch( self, job_key, parent_id, phash_id, phash, children ):

        process_queue = [ ( parent_id, phash_id, phash, children ) ]

        insert_rows = []

        num_done = 0
        num_to_do = len( children ) + 1

        while len( process_queue ) > 0:

            job_key.SetVariable( 'popup_text_2', 'generating new branch -- ' + HydrusData.ConvertValueRangeToPrettyString( num_done, num_to_do ) )

            ( parent_id, phash_id, phash, children ) = process_queue.pop( 0 )

            if len( children ) == 0:

                inner_id = None
                inner_population = 0

                outer_id = None
                outer_population = 0

                radius = None

            else:

                children = [ ( HydrusData.GetHammingDistance( phash, child_phash ), child_id, child_phash ) for ( child_id, child_phash ) in children ]

                children.sort()

                median_index = len( children ) / 2

                median_radius = children[ median_index ][0]

                inner_children = [ ( child_id, child_phash ) for ( distance, child_id, child_phash ) in children if distance < median_radius ]
                radius_children = [ ( child_id, child_phash ) for ( distance, child_id, child_phash ) in children if distance == median_radius ]
                outer_children = [ ( child_id, child_phash ) for ( distance, child_id, child_phash ) in children if distance > median_radius ]

                if len( inner_children ) <= len( outer_children ):

                    radius = median_radius

                    inner_children.extend( radius_children )

                else:

                    radius = median_radius - 1

                    outer_children.extend( radius_children )


                inner_population = len( inner_children )
                outer_population = len( outer_children )

                ( inner_id, inner_phash ) = self._CacheSimilarFilesPopBestRootNode( inner_children ) #HydrusData.MedianPop( inner_children )

                if len( outer_children ) == 0:

                    outer_id = None

                else:

                    ( outer_id, outer_phash ) = self._CacheSimilarFilesPopBestRootNode( outer_children ) #HydrusData.MedianPop( outer_children )


            insert_rows.append( ( phash_id, parent_id, radius, inner_id, inner_population, outer_id, outer_population ) )

            if inner_id is not None:

                process_queue.append( ( phash_id, inner_id, inner_phash, inner_children ) )


            if outer_id is not None:

                process_queue.append( ( phash_id, outer_id, outer_phash, outer_children ) )


            num_done += 1


        job_key.SetVariable( 'popup_text_2', 'branch constructed, now committing' )

        self._c.executemany( 'INSERT INTO shape_vptree ( phash_id, parent_id, radius, inner_id, inner_population, outer_id, outer_population ) VALUES ( ?, ?, ?, ?, ?, ?, ? );', insert_rows )


    def _CacheSimilarFilesGetPHashId( self, phash ):

        result = self._c.execute( 'SELECT phash_id FROM shape_perceptual_hashes WHERE phash = ?;', ( sqlite3.Binary( phash ), ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO shape_perceptual_hashes ( phash ) VALUES ( ? );', ( sqlite3.Binary( phash ), ) )

            phash_id = self._c.lastrowid

            self._CacheSimilarFilesAddLeaf( phash_id, phash )

        else:

            ( phash_id, ) = result


        return phash_id


    def _CacheSimilarFilesGetMaintenanceStatus( self ):

        searched_distances_to_count = collections.Counter( dict( self._c.execute( 'SELECT searched_distance, COUNT( * ) FROM shape_search_cache GROUP BY searched_distance;' ) ) )
        duplicate_types_to_count = collections.Counter( dict( self._c.execute( 'SELECT duplicate_type, COUNT( * ) FROM duplicate_pairs GROUP BY duplicate_type;' ) ) )

        ( num_phashes_to_regen, ) = self._c.execute( 'SELECT COUNT( * ) FROM shape_maintenance_phash_regen;' ).fetchone()
        ( num_branches_to_regen, ) = self._c.execute( 'SELECT COUNT( * ) FROM shape_maintenance_branch_regen;' ).fetchone()

        return ( searched_distances_to_count, duplicate_types_to_count, num_phashes_to_regen, num_branches_to_regen )


    def _CacheSimilarFilesAssociatePHashes( self, hash_id, phashes ):

        phash_ids = set()

        for phash in phashes:

            phash_id = self._CacheSimilarFilesGetPHashId( phash )

            self._c.execute( 'INSERT OR IGNORE INTO shape_perceptual_hash_map ( phash_id, hash_id ) VALUES ( ?, ? );', ( phash_id, hash_id ) )

            phash_ids.add( phash_id )


        self._c.execute( 'REPLACE INTO shape_search_cache ( hash_id, searched_distance ) VALUES ( ?, ? );', ( hash_id, None ) )

        return phash_ids


    def _CacheSimilarFilesMaintainFiles( self, job_key ):

        # this should take a cancellable job_key from the gui filter window

        hash_ids = [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM shape_maintenance_phash_regen;' ) ]

        # remove hash_id from the pairs cache?
        # set its search status to False, but don't remove any existing pairs

        client_files_manager = self._controller.GetClientFilesManager()

        num_to_do = len( hash_ids )

        for ( i, hash_id ) in enumerate( hash_ids ):

            ( i_paused, should_quit ) = job_key.WaitIfNeeded()

            if should_quit:

                return


            text = 'regenerating similar file metadata - ' + HydrusData.ConvertValueRangeToPrettyString( i, num_to_do )

            job_key.SetVariable( 'popup_text_1', text )
            job_key.SetVariable( 'popup_gauge_1', ( i, num_to_do ) )

            try:

                hash = self._GetHash( hash_id )
                mime = self._GetMime( hash_id )

                if mime in HC.MIMES_WE_CAN_PHASH:

                    path = client_files_manager.GetFilePath( hash, mime )

                    if mime in ( HC.IMAGE_JPEG, HC.IMAGE_PNG ):

                        try:

                            phashes = ClientImageHandling.GenerateShapePerceptualHashes( path )

                        except Exception as e:

                            HydrusData.Print( 'Could not generate phashes for ' + path )

                            HydrusData.PrintException( e )

                            phashes = []


                else:

                    phashes = []


            except HydrusExceptions.FileMissingException:

                phashes = []


            existing_phash_ids = { phash_id for ( phash_id, ) in self._c.execute( 'SELECT phash_id FROM shape_perceptual_hash_map WHERE hash_id = ?;', ( hash_id, ) ) }

            correct_phash_ids = self._CacheSimilarFilesAssociatePHashes( hash_id, phashes )

            deletee_phash_ids = existing_phash_ids.difference( correct_phash_ids )

            self._CacheSimilarFilesDelete( hash_id, deletee_phash_ids )

            self._c.execute( 'DELETE FROM shape_maintenance_phash_regen WHERE hash_id = ?;', ( hash_id, ) )


        job_key.Finish()


    def _CacheSimilarFilesMaintainTree( self, stop_time ):

        job_key = ClientThreading.JobKey( cancellable = True )

        job_key.SetVariable( 'popup_title', 'similar files metadata maintenance' )

        job_key_pubbed = False

        rebalance_phash_ids = [ phash_id for ( phash_id, ) in self._c.execute( 'SELECT phash_id FROM shape_maintenance_branch_regen;' ) ]

        num_to_do = len( rebalance_phash_ids )

        while len( rebalance_phash_ids ) > 0:

            if not job_key_pubbed:

                self._controller.pub( 'message', job_key )

                job_key_pubbed = True


            ( i_paused, should_quit ) = job_key.WaitIfNeeded()

            if should_quit or HydrusData.TimeHasPassed( stop_time ):

                return


            num_done = num_to_do - len( rebalance_phash_ids )

            text = 'regenerating unbalanced similar file search data - ' + HydrusData.ConvertValueRangeToPrettyString( num_done, num_to_do )

            HydrusGlobals.client_controller.pub( 'splash_set_status_text', text )
            job_key.SetVariable( 'popup_text_1', text )
            job_key.SetVariable( 'popup_gauge_1', ( num_done, num_to_do ) )

            with HydrusDB.TemporaryIntegerTable( self._c, rebalance_phash_ids, 'phash_id' ) as temp_table_name:

                ( biggest_phash_id, ) = self._c.execute( 'SELECT phash_id FROM shape_vptree, ' + temp_table_name + ' USING ( phash_id ) ORDER BY inner_population + outer_population DESC;' ).fetchone()


            self._CacheSimilarFilesRegenerateBranch( job_key, biggest_phash_id )

            rebalance_phash_ids = [ phash_id for ( phash_id, ) in self._c.execute( 'SELECT phash_id FROM shape_maintenance_branch_regen;' ) ]


        job_key.SetVariable( 'popup_text_1', 'done!' )
        job_key.DeleteVariable( 'popup_gauge_1' )
        job_key.DeleteVariable( 'popup_text_2' )

        job_key.Finish()
        job_key.Delete( 30 )


    def _CacheSimilarFilesMaintenanceDue( self ):

        result = self._c.execute( 'SELECT 1 FROM shape_maintenance_branch_regen;' ).fetchone()

        if result is not None:

            return True


        return False


    def _CacheSimilarFilesPopBestRootNode( self, node_rows ):

        if len( node_rows ) == 1:

            root_row = node_rows.pop(0)

            return root_row


        MAX_VIEWPOINTS = 256
        MAX_SAMPLE = 64

        if len( node_rows ) > MAX_VIEWPOINTS:

            viewpoints = random.sample( node_rows, MAX_VIEWPOINTS )

        else:

            viewpoints = node_rows


        if len( node_rows ) > MAX_SAMPLE:

            sample = random.sample( node_rows, MAX_SAMPLE )

        else:

            sample = node_rows


        final_scores = []

        for ( v_id, v_phash ) in viewpoints:

            views = [ HydrusData.GetHammingDistance( v_phash, s_phash ) for ( s_id, s_phash ) in sample if v_id != s_id ]

            views.sort()

            # let's figure out the ratio of left_children to right_children, preferring 1:1, and convert it to a discrete integer score

            median_index = len( views ) / 2

            radius = views[ median_index ]

            num_left = float( len( [ 1 for view in views if view < radius ] ) )
            num_radius = float( len( [ 1 for view in views if view == radius ] ) )
            num_right = float( len( [ 1 for view in views if view > radius ] ) )

            if num_left <= num_right:

                num_left += num_radius

            else:

                num_right += num_radius


            smaller = min( num_left, num_right )
            larger = max( num_left, num_right )

            ratio = smaller / larger

            ratio_score = int( ratio * MAX_SAMPLE / 2 )

            # now let's calc the standard deviation--larger sd tends to mean less sphere overlap when searching

            mean_view = sum( views ) / float( len( views ) )
            squared_diffs = [ ( view - mean_view  ) ** 2 for view in views ]
            sd = ( sum( squared_diffs ) / len( squared_diffs ) ) ** 0.5

            final_scores.append( ( ratio_score, sd, v_id ) )


        final_scores.sort()

        # we now have a list like [ ( 11, 4.0, [id] ), ( 15, 3.7, [id] ), ( 15, 4.3, [id] ) ]

        ( ratio_gumpf, sd_gumpf, root_id ) = final_scores.pop()

        for ( i, ( v_id, v_phash ) ) in enumerate( node_rows ):

            if v_id == root_id:

                root_row = node_rows.pop( i )

                return root_row


    def _CacheSimilarFilesRegenerateBranch( self, job_key, phash_id ):

        job_key.SetVariable( 'popup_text_2', 'reviewing existing branch' )

        # grab everything in the branch

        ( parent_id, ) = self._c.execute( 'SELECT parent_id FROM shape_vptree WHERE phash_id = ?;', ( phash_id, ) ).fetchone()

        cte_table_name = 'branch ( branch_phash_id )'
        initial_select = 'SELECT ?'
        recursive_select = 'SELECT phash_id FROM shape_vptree, branch ON parent_id = branch_phash_id'

        with_clause = 'WITH RECURSIVE ' + cte_table_name + ' AS ( ' + initial_select + ' UNION ALL ' +  recursive_select +  ')'

        unbalanced_nodes = self._c.execute( with_clause + ' SELECT branch_phash_id, phash FROM branch, shape_perceptual_hashes ON phash_id = branch_phash_id;', ( phash_id, ) ).fetchall()

        # removal of old branch, maintenance schedule, and orphan phashes

        job_key.SetVariable( 'popup_text_2', HydrusData.ConvertIntToPrettyString( len( unbalanced_nodes ) ) + ' leaves found--now clearing out old branch' )

        unbalanced_phash_ids = { p_id for ( p_id, p_h ) in unbalanced_nodes }

        self._c.executemany( 'DELETE FROM shape_vptree WHERE phash_id = ?;', ( ( p_id, ) for p_id in unbalanced_phash_ids ) )

        self._c.executemany( 'DELETE FROM shape_maintenance_branch_regen WHERE phash_id = ?;', ( ( p_id, ) for p_id in unbalanced_phash_ids ) )

        with HydrusDB.TemporaryIntegerTable( self._c, unbalanced_phash_ids, 'phash_id' ) as temp_table_name:

            useful_phash_ids = { p_id for ( p_id, ) in self._c.execute( 'SELECT phash_id FROM shape_perceptual_hash_map, ' + temp_table_name + ' USING ( phash_id );' ) }


        orphan_phash_ids = unbalanced_phash_ids.difference( useful_phash_ids )

        self._c.executemany( 'DELETE FROM shape_perceptual_hashes WHERE phash_id = ?;', ( ( p_id, ) for p_id in orphan_phash_ids ) )

        useful_nodes = [ row for row in unbalanced_nodes if row[0] in useful_phash_ids ]

        useful_population = len( useful_nodes )

        # now create the new branch, starting by choosing a new root and updating the parent's left/right reference to that

        if useful_population > 0:

            ( new_phash_id, new_phash ) = self._CacheSimilarFilesPopBestRootNode( useful_nodes ) #HydrusData.RandomPop( useful_nodes )

        else:

            new_phash_id = None


        if parent_id is not None:

            ( parent_inner_id, ) = self._c.execute( 'SELECT inner_id FROM shape_vptree WHERE phash_id = ?;', ( parent_id, ) ).fetchone()

            if parent_inner_id == phash_id:

                query = 'UPDATE shape_vptree SET inner_id = ?, inner_population = ? WHERE phash_id = ?;'

            else:

                query = 'UPDATE shape_vptree SET outer_id = ?, outer_population = ? WHERE phash_id = ?;'


            self._c.execute( query, ( new_phash_id, useful_population, parent_id ) )


        if useful_population > 0:

            self._CacheSimilarFilesGenerateBranch( job_key, parent_id, new_phash_id, new_phash, useful_nodes )


    def _CacheSimilarFilesRegenerateTree( self ):

        job_key = ClientThreading.JobKey()

        job_key.SetVariable( 'popup_title', 'regenerating similar file search data' )

        self._controller.pub( 'message', job_key )

        job_key.SetVariable( 'popup_text_1', 'gathering all leaves' )

        self._c.execute( 'DELETE FROM shape_vptree;' )

        all_nodes = self._c.execute( 'SELECT phash_id, phash FROM shape_perceptual_hashes;' ).fetchall()

        job_key.SetVariable( 'popup_text_1', HydrusData.ConvertIntToPrettyString( len( all_nodes ) ) + ' leaves found, now regenerating' )

        ( root_id, root_phash ) = self._CacheSimilarFilesPopBestRootNode( all_nodes ) #HydrusData.RandomPop( all_nodes )

        self._CacheSimilarFilesGenerateBranch( job_key, None, root_id, root_phash, all_nodes )

        job_key.SetVariable( 'popup_text_1', 'done!' )
        job_key.DeleteVariable( 'popup_text_2' )


    def _CacheSimilarFilesSchedulePHashRegeneration( self, hash_ids = None ):

        if hash_ids is None:

            hash_ids = [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM files_info, current_files USING ( hash_id ) WHERE service_id = ? AND mime IN ' + HydrusData.SplayListForDB( HC.MIMES_WE_CAN_PHASH ) + ';', ( self._combined_local_file_service_id, ) ) ]


        self._c.executemany( 'INSERT OR IGNORE INTO shape_maintenance_phash_regen ( hash_id ) VALUES ( ? );', ( ( hash_id, ) for hash_id in hash_ids ) )


    def _CacheSimilarFilesSearch( self, hash_id, max_hamming_distance ):

        search_radius = max_hamming_distance

        result = self._c.execute( 'SELECT phash_id FROM shape_vptree WHERE parent_id IS NULL;' ).fetchone()

        if result is None:

            return []


        ( root_node_phash_id, ) = result

        search_phashes = [ phash for ( phash, ) in self._c.execute( 'SELECT phash FROM shape_perceptual_hashes, shape_perceptual_hash_map USING ( phash_id ) WHERE hash_id = ?;', ( hash_id, ) ) ]

        if len( search_phashes ) == 0:

            return []


        potentials = [ ( root_node_phash_id, tuple( search_phashes ) ) ]
        similar_phash_ids = set()

        num_cycles = 0

        while len( potentials ) > 0:

            num_cycles += 1

            ( node_phash_id, search_phashes ) = potentials.pop( 0 )

            ( node_phash, node_radius, inner_phash_id, outer_phash_id ) = self._c.execute( 'SELECT phash, radius, inner_id, outer_id FROM shape_perceptual_hashes, shape_vptree USING ( phash_id ) WHERE phash_id = ?;', ( node_phash_id, ) ).fetchone()

            inner_search_phashes = []
            outer_search_phashes = []

            for search_phash in search_phashes:

                # first check the node--is it similar?

                node_hamming_distance = HydrusData.GetHammingDistance( search_phash, node_phash )

                if node_hamming_distance <= search_radius:

                    similar_phash_ids.add( node_phash_id )


                # now how about its children?

                if node_radius is not None:

                    # we have two spheres--node and search--their centers separated by node_hamming_distance
                    # we want to search inside/outside the node_sphere if the search_sphere intersects with those spaces
                    # there are four possibles:
                    # (----N----)-(--S--)    intersects with outer only - distance between N and S > their radii
                    # (----N---(-)-S--)      intersects with both
                    # (----N-(--S-)-)        intersects with both
                    # (---(-N-S--)-)         intersects with inner only - distance between N and S + radius_S does not exceed radius_N

                    spheres_disjoint = node_hamming_distance > node_radius + search_radius
                    search_sphere_subset_of_node_sphere = node_hamming_distance + search_radius <= node_radius

                    if not spheres_disjoint: # i.e. they intersect at some point

                        inner_search_phashes.append( search_phash )


                    if not search_sphere_subset_of_node_sphere: # i.e. search sphere intersects with non-node sphere space at some point

                        outer_search_phashes.append( search_phash )


            if inner_phash_id is not None and len( inner_search_phashes ) > 0:

                potentials.append( ( inner_phash_id, tuple( inner_search_phashes ) ) )


            if outer_phash_id is not None and len( outer_search_phashes ) > 0:

                potentials.append( ( outer_phash_id, tuple( outer_search_phashes ) ) )


        if HydrusGlobals.db_report_mode:

            HydrusData.ShowText( 'Similar file search completed in ' + HydrusData.ConvertIntToPrettyString( num_cycles ) + ' cycles.' )


        with HydrusDB.TemporaryIntegerTable( self._c, similar_phash_ids, 'phash_id' ) as temp_table_name:

            similar_hash_ids = [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM shape_perceptual_hash_map, ' + temp_table_name + ' USING ( phash_id );' ) ]


        return similar_hash_ids


    def _CacheSpecificMappingsAddFiles( self, file_service_id, tag_service_id, hash_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        self._c.executemany( 'INSERT OR IGNORE INTO ' + cache_files_table_name + ' VALUES ( ? );', ( ( hash_id, ) for hash_id in hash_ids ) )

        ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( tag_service_id )

        ac_cache_changes = []

        for group_of_hash_ids in HydrusData.SplitListIntoChunks( hash_ids, 100 ):

            splayed_group_of_hash_ids = HydrusData.SplayListForDB( group_of_hash_ids )

            current_mapping_ids_raw = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + current_mappings_table_name + ' WHERE hash_id IN ' + splayed_group_of_hash_ids + ';' ).fetchall()

            current_mapping_ids_dict = HydrusData.BuildKeyToSetDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in current_mapping_ids_raw ] )

            pending_mapping_ids_raw = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + pending_mappings_table_name + ' WHERE hash_id IN ' + splayed_group_of_hash_ids + ';' ).fetchall()

            pending_mapping_ids_dict = HydrusData.BuildKeyToSetDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in pending_mapping_ids_raw ] )

            all_ids_seen = set( current_mapping_ids_dict.keys() )
            all_ids_seen.update( pending_mapping_ids_dict.keys() )

            for ( namespace_id, tag_id ) in all_ids_seen:

                current_hash_ids = current_mapping_ids_dict[ ( namespace_id, tag_id ) ]

                num_current = len( current_hash_ids )

                if num_current > 0:

                    self._c.executemany( 'INSERT OR IGNORE INTO ' + cache_current_mappings_table_name + ' ( hash_id, namespace_id, tag_id ) VALUES ( ?, ?, ? );', ( ( hash_id, namespace_id, tag_id ) for hash_id in current_hash_ids ) )


                pending_hash_ids = pending_mapping_ids_dict[ ( namespace_id, tag_id ) ]

                num_pending = len( pending_hash_ids )

                if num_pending > 0:

                    self._c.executemany( 'INSERT OR IGNORE INTO ' + cache_pending_mappings_table_name + ' ( hash_id, namespace_id, tag_id ) VALUES ( ?, ?, ? );', ( ( hash_id, namespace_id, tag_id ) for hash_id in pending_hash_ids ) )


                if num_current > 0 or num_pending > 0:

                    ac_cache_changes.append( ( namespace_id, tag_id, num_current, num_pending ) )


        if len( ac_cache_changes ) > 0:

            self._c.executemany( 'INSERT OR IGNORE INTO ' + ac_cache_table_name + ' ( namespace_id, tag_id, current_count, pending_count ) VALUES ( ?, ?, ?, ? );', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, num_current, num_pending ) in ac_cache_changes ) )

            self._c.executemany( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count + ?, pending_count = pending_count + ? WHERE namespace_id = ? AND tag_id = ?;', ( ( num_current, num_pending, namespace_id, tag_id ) for ( namespace_id, tag_id, num_current, num_pending ) in ac_cache_changes ) )


    def _CacheSpecificMappingsAddMappings( self, file_service_id, tag_service_id, mappings_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        for ( namespace_id, tag_id, hash_ids ) in mappings_ids:

            hash_ids = self._CacheSpecificMappingsFilterHashIds( file_service_id, tag_service_id, hash_ids )

            if len( hash_ids ) > 0:

                self._c.executemany( 'DELETE FROM ' + cache_pending_mappings_table_name + ' WHERE hash_id = ? AND namespace_id = ? AND tag_id = ?;', ( ( hash_id, namespace_id, tag_id ) for hash_id in hash_ids ) )

                num_pending_rescinded = self._GetRowCount()

                #

                self._c.executemany( 'INSERT OR IGNORE INTO ' + cache_current_mappings_table_name + ' ( hash_id, namespace_id, tag_id ) VALUES ( ?, ?, ? );', ( ( hash_id, namespace_id, tag_id ) for hash_id in hash_ids ) )

                num_added = self._GetRowCount()

                if num_pending_rescinded > 0:

                    self._c.execute( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count + ?, pending_count = pending_count - ? WHERE namespace_id = ? AND tag_id = ?;', ( num_added, num_pending_rescinded, namespace_id, tag_id ) )

                elif num_added > 0:

                    self._c.execute( 'INSERT OR IGNORE INTO ' + ac_cache_table_name + ' ( namespace_id, tag_id, current_count, pending_count ) VALUES ( ?, ?, ?, ? );', ( namespace_id, tag_id, 0, 0 ) )

                    self._c.execute( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count + ? WHERE namespace_id = ? AND tag_id = ?;', ( num_added, namespace_id, tag_id ) )


    def _CacheSpecificMappingsDrop( self, file_service_id, tag_service_id ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        self._c.execute( 'DROP TABLE IF EXISTS ' + cache_files_table_name + ';' )

        self._c.execute( 'DROP TABLE IF EXISTS ' + cache_current_mappings_table_name + ';' )

        self._c.execute( 'DROP TABLE IF EXISTS ' + cache_pending_mappings_table_name + ';' )

        self._c.execute( 'DROP TABLE IF EXISTS ' + ac_cache_table_name + ';' )


    def _CacheSpecificMappingsDeleteFiles( self, file_service_id, tag_service_id, hash_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        self._c.executemany( 'DELETE FROM ' + cache_files_table_name + ' WHERE hash_id = ?;', ( ( hash_id, ) for hash_id in hash_ids ) )

        ac_cache_changes = []

        for group_of_hash_ids in HydrusData.SplitListIntoChunks( hash_ids, 100 ):

            splayed_group_of_hash_ids = HydrusData.SplayListForDB( group_of_hash_ids )

            current_mapping_ids_raw = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + cache_current_mappings_table_name + ' WHERE hash_id IN ' + splayed_group_of_hash_ids + ';' ).fetchall()

            current_mapping_ids_dict = HydrusData.BuildKeyToSetDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in current_mapping_ids_raw ] )

            pending_mapping_ids_raw = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + cache_pending_mappings_table_name + ' WHERE hash_id IN ' + splayed_group_of_hash_ids + ';' ).fetchall()

            pending_mapping_ids_dict = HydrusData.BuildKeyToSetDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in pending_mapping_ids_raw ] )

            all_ids_seen = set( current_mapping_ids_dict.keys() )
            all_ids_seen.update( pending_mapping_ids_dict.keys() )

            for ( namespace_id, tag_id ) in all_ids_seen:

                current_hash_ids = current_mapping_ids_dict[ ( namespace_id, tag_id ) ]

                num_current = len( current_hash_ids )

                if num_current > 0:

                    self._c.executemany( 'DELETE FROM ' + cache_current_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id = ?;', ( ( namespace_id, tag_id, hash_id ) for hash_id in current_hash_ids ) )


                pending_hash_ids = pending_mapping_ids_dict[ ( namespace_id, tag_id ) ]

                num_pending = len( pending_hash_ids )

                if num_pending > 0:

                    self._c.executemany( 'DELETE FROM ' + cache_pending_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id = ?;', ( ( namespace_id, tag_id, hash_id ) for hash_id in pending_hash_ids ) )


                ac_cache_changes.append( ( namespace_id, tag_id, num_current, num_pending ) )


        if len( ac_cache_changes ) > 0:

            self._c.executemany( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count - ?, pending_count = pending_count - ? WHERE namespace_id = ? AND tag_id = ?;', ( ( num_current, num_pending, namespace_id, tag_id ) for ( namespace_id, tag_id, num_current, num_pending ) in ac_cache_changes ) )

            self._c.executemany( 'DELETE FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND current_count = ? AND pending_count = ?;', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, num_current, num_pending ) in ac_cache_changes ) )


    def _CacheSpecificMappingsDeleteMappings( self, file_service_id, tag_service_id, mappings_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        for ( namespace_id, tag_id, hash_ids ) in mappings_ids:

            hash_ids = self._CacheSpecificMappingsFilterHashIds( file_service_id, tag_service_id, hash_ids )

            if len( hash_ids ) > 0:

                self._c.executemany( 'DELETE FROM ' + cache_current_mappings_table_name + ' WHERE hash_id = ? AND namespace_id = ? AND tag_id = ?;', ( ( hash_id, namespace_id, tag_id ) for hash_id in hash_ids ) )

                num_deleted = self._GetRowCount()

                if num_deleted > 0:

                    self._c.execute( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count - ? WHERE namespace_id = ? AND tag_id = ?;', ( num_deleted, namespace_id, tag_id ) )

                    self._c.execute( 'DELETE FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND current_count = ? AND pending_count = ?;', ( namespace_id, tag_id, 0, 0 ) )


    def _CacheSpecificMappingsFilterHashIds( self, file_service_id, tag_service_id, hash_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        return [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM ' + cache_files_table_name + ' WHERE hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';' ) ]


    def _CacheSpecificMappingsGenerate( self, file_service_id, tag_service_id ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        self._c.execute( 'CREATE TABLE ' + cache_files_table_name + ' ( hash_id INTEGER PRIMARY KEY );' )

        self._c.execute( 'CREATE TABLE ' + cache_current_mappings_table_name + ' ( hash_id INTEGER, namespace_id INTEGER, tag_id INTEGER, PRIMARY KEY( hash_id, namespace_id, tag_id ) ) WITHOUT ROWID;' )

        self._c.execute( 'CREATE TABLE ' + cache_pending_mappings_table_name + ' ( hash_id INTEGER, namespace_id INTEGER, tag_id INTEGER, PRIMARY KEY( hash_id, namespace_id, tag_id ) ) WITHOUT ROWID;' )

        self._c.execute( 'CREATE TABLE ' + ac_cache_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, current_count INTEGER, pending_count INTEGER, PRIMARY KEY( namespace_id, tag_id ) ) WITHOUT ROWID;' )

        #

        hash_ids = [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?;', ( file_service_id, ) ) ]

        if len( hash_ids ) > 0:

            self._CacheSpecificMappingsAddFiles( file_service_id, tag_service_id, hash_ids )


    def _CacheSpecificMappingsGetAutocompleteCounts( self, file_service_id, tag_service_id, namespace_ids_to_tag_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        results = []

        for ( namespace_id, tag_ids ) in namespace_ids_to_tag_ids.items():

            results.extend( ( ( namespace_id, tag_id, current_count, pending_count ) for ( tag_id, current_count, pending_count ) in self._c.execute( 'SELECT tag_id, current_count, pending_count FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id IN ' + HydrusData.SplayListForDB( tag_ids ) + ';', ( namespace_id, ) ) ) )


        return results


    def _CacheSpecificMappingsPendMappings( self, file_service_id, tag_service_id, mappings_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        for ( namespace_id, tag_id, hash_ids ) in mappings_ids:

            hash_ids = self._CacheSpecificMappingsFilterHashIds( file_service_id, tag_service_id, hash_ids )

            if len( hash_ids ) > 0:

                self._c.executemany( 'INSERT OR IGNORE INTO ' + cache_pending_mappings_table_name + ' ( hash_id, namespace_id, tag_id ) VALUES ( ?, ?, ? );', ( ( hash_id, namespace_id, tag_id ) for hash_id in hash_ids ) )

                num_added = self._GetRowCount()

                if num_added > 0:

                    self._c.execute( 'INSERT OR IGNORE INTO ' + ac_cache_table_name + ' ( namespace_id, tag_id, current_count, pending_count ) VALUES ( ?, ?, ?, ? );', ( namespace_id, tag_id, 0, 0 ) )

                    self._c.execute( 'UPDATE ' + ac_cache_table_name + ' SET pending_count = pending_count + ? WHERE namespace_id = ? AND tag_id = ?;', ( num_added, namespace_id, tag_id ) )


    def _CacheSpecificMappingsRescindPendingMappings( self, file_service_id, tag_service_id, mappings_ids ):

        ( cache_files_table_name, cache_current_mappings_table_name, cache_pending_mappings_table_name, ac_cache_table_name ) = GenerateSpecificMappingsCacheTableNames( file_service_id, tag_service_id )

        for ( namespace_id, tag_id, hash_ids ) in mappings_ids:

            hash_ids = self._CacheSpecificMappingsFilterHashIds( file_service_id, tag_service_id, hash_ids )

            if len( hash_ids ) > 0:

                self._c.executemany( 'DELETE FROM ' + cache_pending_mappings_table_name + ' WHERE hash_id = ? AND namespace_id = ? AND tag_id = ?;', ( ( hash_id, namespace_id, tag_id ) for hash_id in hash_ids ) )

                num_deleted = self._GetRowCount()

                if num_deleted > 0:

                    self._c.execute( 'UPDATE ' + ac_cache_table_name + ' SET pending_count = pending_count - ? WHERE namespace_id = ? AND tag_id = ?;', ( num_deleted, namespace_id, tag_id ) )

                    self._c.execute( 'DELETE FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND current_count = ? AND pending_count = ?;', ( namespace_id, tag_id, 0, 0 ) )


    def _CheckDBIntegrity( self ):

        prefix_string = 'checking db integrity: '

        job_key = ClientThreading.JobKey( cancellable = True )

        job_key.SetVariable( 'popup_title', prefix_string + 'preparing' )

        self._controller.pub( 'message', job_key )

        num_errors = 0

        job_key.SetVariable( 'popup_title', prefix_string + 'running' )
        job_key.SetVariable( 'popup_text_1', 'errors found so far: ' + HydrusData.ConvertIntToPrettyString( num_errors ) )

        db_names = [ name for ( index, name, path ) in self._c.execute( 'PRAGMA database_list;' ) if name not in ( 'mem', 'temp' ) ]

        for db_name in db_names:

            for ( text, ) in self._c.execute( 'PRAGMA ' + db_name + '.integrity_check;' ):

                ( i_paused, should_quit ) = job_key.WaitIfNeeded()

                if should_quit:

                    job_key.SetVariable( 'popup_title', prefix_string + 'cancelled' )
                    job_key.SetVariable( 'popup_text_1', 'errors found: ' + HydrusData.ConvertIntToPrettyString( num_errors ) )

                    return


                if text != 'ok':

                    if num_errors == 0:

                        HydrusData.Print( 'During a db integrity check, these errors were discovered:' )


                    HydrusData.Print( text )

                    num_errors += 1


                job_key.SetVariable( 'popup_text_1', 'errors found so far: ' + HydrusData.ConvertIntToPrettyString( num_errors ) )


        job_key.SetVariable( 'popup_title', prefix_string + 'completed' )
        job_key.SetVariable( 'popup_text_1', 'errors found: ' + HydrusData.ConvertIntToPrettyString( num_errors ) )

        HydrusData.Print( job_key.ToString() )

        job_key.Finish()


    def _CheckFileIntegrity( self, mode, move_location = None ):

        prefix_string = 'checking file integrity: '

        job_key = ClientThreading.JobKey( cancellable = True )

        job_key.SetVariable( 'popup_text_1', prefix_string + 'preparing' )

        self._controller.pub( 'message', job_key )

        info = self._c.execute( 'SELECT hash_id, mime FROM current_files, files_info USING ( hash_id ) WHERE service_id = ?;', ( self._combined_local_file_service_id, ) ).fetchall()

        missing_count = 0
        deletee_hash_ids = []

        client_files_manager = self._controller.GetClientFilesManager()

        for ( i, ( hash_id, mime ) ) in enumerate( info ):

            ( i_paused, should_quit ) = job_key.WaitIfNeeded()

            if should_quit:

                return


            job_key.SetVariable( 'popup_text_1', prefix_string + HydrusData.ConvertValueRangeToPrettyString( i, len( info ) ) )
            job_key.SetVariable( 'popup_gauge_1', ( i, len( info ) ) )

            hash = self._GetHash( hash_id )

            try:

                # lockless because this db call is made by the locked client files manager
                path = client_files_manager.LocklessGetFilePath( hash, mime )

            except HydrusExceptions.FileMissingException:

                print( 'Could not find the file for ' + hash.encode( 'hex' ) + '!' )

                deletee_hash_ids.append( hash_id )

                missing_count += 1

                continue


            if mode == 'thorough':

                actual_hash = HydrusFileHandling.GetHashFromPath( path )

                if actual_hash != hash:

                    deletee_hash_ids.append( hash_id )

                    if move_location is not None:

                        move_filename = 'believed ' + hash.encode( 'hex' ) + ' actually ' + actual_hash.encode( 'hex' ) + HC.mime_ext_lookup[ mime ]

                        move_path = os.path.join( move_location, move_filename )

                        HydrusPaths.MergeFile( path, move_path )


        job_key.DeleteVariable( 'popup_gauge_1' )
        job_key.SetVariable( 'popup_text_1', prefix_string + 'deleting the incorrect records' )

        self._DeleteFiles( self._local_file_service_id, deletee_hash_ids )
        self._DeleteFiles( self._trash_service_id, deletee_hash_ids )
        self._DeleteFiles( self._combined_local_file_service_id, deletee_hash_ids )

        final_text = 'done! '

        if len( deletee_hash_ids ) == 0:

            final_text += 'all files ok!'

        else:

            final_text += HydrusData.ConvertIntToPrettyString( missing_count ) + ' files were missing!'

            if mode == 'thorough':

                final_text += ' ' + HydrusData.ConvertIntToPrettyString( len( deletee_hash_ids ) - missing_count ) + ' files were incorrect and thus '

                if move_location is None:

                    final_text += 'deleted!'

                else:

                    final_text += 'moved!'


        job_key.SetVariable( 'popup_text_1', prefix_string + final_text )

        HydrusData.Print( job_key.ToString() )

        job_key.Finish()


    def _CleanUpCaches( self ):

        self._subscriptions_cache = {}
        self._service_cache = {}


    def _CreateDB( self ):

        client_files_default = os.path.join( self._db_dir, 'client_files' )

        HydrusPaths.MakeSureDirectoryExists( client_files_default )

        other_dirs = []

        other_dirs.append( self._updates_dir )

        for path in other_dirs:

            HydrusPaths.MakeSureDirectoryExists( path )


        HydrusDB.SetupDBCreatePragma( self._c, no_wal = self._no_wal )

        try: self._c.execute( 'BEGIN IMMEDIATE;' )
        except Exception as e:

            raise HydrusExceptions.DBAccessException( HydrusData.ToUnicode( e ) )


        self._c.execute( 'CREATE TABLE services ( service_id INTEGER PRIMARY KEY AUTOINCREMENT, service_key BLOB_BYTES, service_type INTEGER, name TEXT, info TEXT_YAML );' )
        self._c.execute( 'CREATE UNIQUE INDEX services_service_key_index ON services ( service_key );' )

        # main

        self._c.execute( 'CREATE TABLE analyze_timestamps ( name TEXT, num_rows INTEGER, timestamp INTEGER );' )

        self._c.execute( 'CREATE TABLE client_files_locations ( prefix TEXT, location TEXT );' )

        self._c.execute( 'CREATE TABLE contacts ( contact_id INTEGER PRIMARY KEY, contact_key BLOB_BYTES, public_key TEXT, name TEXT, host TEXT, port INTEGER );' )
        self._c.execute( 'CREATE UNIQUE INDEX contacts_contact_key_index ON contacts ( contact_key );' )
        self._c.execute( 'CREATE UNIQUE INDEX contacts_name_index ON contacts ( name );' )

        self._c.execute( 'CREATE VIRTUAL TABLE conversation_subjects USING fts4( subject );' )

        self._c.execute( 'CREATE TABLE current_files ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, timestamp INTEGER, PRIMARY KEY( service_id, hash_id ) );' )
        self._c.execute( 'CREATE INDEX current_files_timestamp ON current_files ( timestamp );' )

        self._c.execute( 'CREATE TABLE deleted_files ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, PRIMARY KEY( service_id, hash_id ) );' )

        self._c.execute( 'CREATE TABLE existing_tags ( namespace_id INTEGER, tag_id INTEGER, PRIMARY KEY( namespace_id, tag_id ) );' )
        self._c.execute( 'CREATE INDEX existing_tags_tag_id_index ON existing_tags ( tag_id );' )

        self._c.execute( 'CREATE TABLE file_inbox ( hash_id INTEGER PRIMARY KEY );' )

        self._c.execute( 'CREATE TABLE files_info ( hash_id INTEGER PRIMARY KEY, size INTEGER, mime INTEGER, width INTEGER, height INTEGER, duration INTEGER, num_frames INTEGER, num_words INTEGER );' )
        self._c.execute( 'CREATE INDEX files_info_size ON files_info ( size );' )
        self._c.execute( 'CREATE INDEX files_info_mime ON files_info ( mime );' )
        self._c.execute( 'CREATE INDEX files_info_width ON files_info ( width );' )
        self._c.execute( 'CREATE INDEX files_info_height ON files_info ( height );' )
        self._c.execute( 'CREATE INDEX files_info_duration ON files_info ( duration );' )
        self._c.execute( 'CREATE INDEX files_info_num_frames ON files_info ( num_frames );' )

        self._c.execute( 'CREATE TABLE file_transfers ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, PRIMARY KEY( service_id, hash_id ) );' )
        self._c.execute( 'CREATE INDEX file_transfers_hash_id ON file_transfers ( hash_id );' )

        self._c.execute( 'CREATE TABLE file_petitions ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, reason_id INTEGER, PRIMARY KEY( service_id, hash_id, reason_id ) );' )
        self._c.execute( 'CREATE INDEX file_petitions_hash_id_index ON file_petitions ( hash_id );' )

        self._c.execute( 'CREATE TABLE hydrus_sessions ( service_id INTEGER PRIMARY KEY REFERENCES services ON DELETE CASCADE, session_key BLOB_BYTES, expiry INTEGER );' )

        self._c.execute( 'CREATE TABLE json_dict ( name TEXT PRIMARY KEY, dump BLOB_BYTES );' )
        self._c.execute( 'CREATE TABLE json_dumps ( dump_type INTEGER PRIMARY KEY, version INTEGER, dump BLOB_BYTES );' )
        self._c.execute( 'CREATE TABLE json_dumps_named ( dump_type INTEGER, dump_name TEXT, version INTEGER, dump BLOB_BYTES, PRIMARY KEY ( dump_type, dump_name ) );' )

        self._c.execute( 'CREATE TABLE local_hashes ( hash_id INTEGER PRIMARY KEY, md5 BLOB_BYTES, sha1 BLOB_BYTES, sha512 BLOB_BYTES );' )
        self._c.execute( 'CREATE INDEX local_hashes_md5_index ON local_hashes ( md5 );' )
        self._c.execute( 'CREATE INDEX local_hashes_sha1_index ON local_hashes ( sha1 );' )
        self._c.execute( 'CREATE INDEX local_hashes_sha512_index ON local_hashes ( sha512 );' )

        self._c.execute( 'CREATE TABLE local_ratings ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, rating REAL, PRIMARY KEY( service_id, hash_id ) );' )
        self._c.execute( 'CREATE INDEX local_ratings_hash_id_index ON local_ratings ( hash_id );' )
        self._c.execute( 'CREATE INDEX local_ratings_rating_index ON local_ratings ( rating );' )

        self._c.execute( 'CREATE TABLE message_attachments ( message_id INTEGER PRIMARY KEY REFERENCES message_keys ON DELETE CASCADE, hash_id INTEGER );' )

        self._c.execute( 'CREATE TABLE message_depots ( service_id INTEGER PRIMARY KEY REFERENCES services ON DELETE CASCADE, contact_id INTEGER, last_check INTEGER, check_period INTEGER, private_key TEXT, receive_anon INTEGER_BOOLEAN );' )
        self._c.execute( 'CREATE UNIQUE INDEX message_depots_contact_id_index ON message_depots ( contact_id );' )

        self._c.execute( 'CREATE TABLE message_destination_map ( message_id INTEGER REFERENCES message_keys ON DELETE CASCADE, contact_id_to INTEGER, status_id INTEGER, PRIMARY KEY ( message_id, contact_id_to ) );' )
        self._c.execute( 'CREATE INDEX message_destination_map_contact_id_to_index ON message_destination_map ( contact_id_to );' )
        self._c.execute( 'CREATE INDEX message_destination_map_status_id_index ON message_destination_map ( status_id );' )

        self._c.execute( 'CREATE TABLE message_downloads ( service_id INTEGER REFERENCES services ON DELETE CASCADE, message_id INTEGER REFERENCES message_keys ON DELETE CASCADE );' )
        self._c.execute( 'CREATE INDEX message_downloads_service_id_index ON message_downloads ( service_id );' )

        self._c.execute( 'CREATE TABLE message_drafts ( message_id INTEGER REFERENCES message_keys ON DELETE CASCADE, recipients_visible INTEGER_BOOLEAN );' )

        self._c.execute( 'CREATE TABLE message_inbox ( message_id INTEGER PRIMARY KEY REFERENCES message_keys ON DELETE CASCADE );' )

        self._c.execute( 'CREATE TABLE message_keys ( message_id INTEGER PRIMARY KEY, message_key BLOB_BYTES );' )
        self._c.execute( 'CREATE INDEX message_keys_message_key_index ON message_keys ( message_key );' )

        self._c.execute( 'CREATE VIRTUAL TABLE message_bodies USING fts4( body );' )

        self._c.execute( 'CREATE TABLE incoming_message_statuses ( message_id INTEGER REFERENCES message_keys ON DELETE CASCADE, contact_key BLOB_BYTES, status_id INTEGER, PRIMARY KEY ( message_id, contact_key ) );' )

        self._c.execute( 'CREATE TABLE messages ( conversation_id INTEGER REFERENCES message_keys ( message_id ) ON DELETE CASCADE, message_id INTEGER REFERENCES message_keys ON DELETE CASCADE, contact_id_from INTEGER, timestamp INTEGER, PRIMARY KEY( conversation_id, message_id ) );' )
        self._c.execute( 'CREATE UNIQUE INDEX messages_message_id_index ON messages ( message_id );' )
        self._c.execute( 'CREATE INDEX messages_contact_id_from_index ON messages ( contact_id_from );' )
        self._c.execute( 'CREATE INDEX messages_timestamp_index ON messages ( timestamp );' )

        self._c.execute( 'CREATE TABLE news ( service_id INTEGER REFERENCES services ON DELETE CASCADE, post TEXT, timestamp INTEGER );' )

        self._c.execute( 'CREATE TABLE options ( options TEXT_YAML );', )

        self._c.execute( 'CREATE TABLE recent_tags ( service_id INTEGER REFERENCES services ON DELETE CASCADE, namespace_id INTEGER, tag_id INTEGER, timestamp INTEGER, PRIMARY KEY ( service_id, namespace_id, tag_id ) );' )

        self._c.execute( 'CREATE TABLE remote_ratings ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, count INTEGER, rating REAL, score REAL, PRIMARY KEY( service_id, hash_id ) );' )
        self._c.execute( 'CREATE INDEX remote_ratings_hash_id_index ON remote_ratings ( hash_id );' )
        self._c.execute( 'CREATE INDEX remote_ratings_rating_index ON remote_ratings ( rating );' )
        self._c.execute( 'CREATE INDEX remote_ratings_score_index ON remote_ratings ( score );' )

        self._c.execute( 'CREATE TABLE service_filenames ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, filename TEXT, PRIMARY KEY( service_id, hash_id ) );' )
        self._c.execute( 'CREATE TABLE service_directories ( service_id INTEGER REFERENCES services ON DELETE CASCADE, directory_id INTEGER, num_files INTEGER, total_size INTEGER, note TEXT, PRIMARY KEY( service_id, directory_id ) );' )
        self._c.execute( 'CREATE TABLE service_directory_file_map ( service_id INTEGER REFERENCES services ON DELETE CASCADE, directory_id INTEGER, hash_id INTEGER, PRIMARY KEY( service_id, directory_id, hash_id ) );' )

        self._c.execute( 'CREATE TABLE service_info ( service_id INTEGER REFERENCES services ON DELETE CASCADE, info_type INTEGER, info INTEGER, PRIMARY KEY ( service_id, info_type ) );' )

        self._c.execute( 'CREATE TABLE statuses ( status_id INTEGER PRIMARY KEY, status TEXT );' )
        self._c.execute( 'CREATE UNIQUE INDEX statuses_status_index ON statuses ( status );' )

        self._c.execute( 'CREATE TABLE tag_censorship ( service_id INTEGER PRIMARY KEY REFERENCES services ON DELETE CASCADE, blacklist INTEGER_BOOLEAN, tags TEXT_YAML );' )

        self._c.execute( 'CREATE TABLE tag_parents ( service_id INTEGER REFERENCES services ON DELETE CASCADE, child_namespace_id INTEGER, child_tag_id INTEGER, parent_namespace_id INTEGER, parent_tag_id INTEGER, status INTEGER, PRIMARY KEY ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status ) );' )
        self._c.execute( 'CREATE INDEX tag_parents_service_id_status_index ON tag_parents ( service_id, status );' )
        self._c.execute( 'CREATE INDEX tag_parents_status_index ON tag_parents ( status );' )

        self._c.execute( 'CREATE TABLE tag_parent_petitions ( service_id INTEGER REFERENCES services ON DELETE CASCADE, child_namespace_id INTEGER, child_tag_id INTEGER, parent_namespace_id INTEGER, parent_tag_id INTEGER, status INTEGER, reason_id INTEGER, PRIMARY KEY ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status ) );' )

        self._c.execute( 'CREATE TABLE tag_siblings ( service_id INTEGER REFERENCES services ON DELETE CASCADE, old_namespace_id INTEGER, old_tag_id INTEGER, new_namespace_id INTEGER, new_tag_id INTEGER, status INTEGER, PRIMARY KEY ( service_id, old_namespace_id, old_tag_id, status ) );' )
        self._c.execute( 'CREATE INDEX tag_siblings_service_id_status_index ON tag_siblings ( service_id, status );' )
        self._c.execute( 'CREATE INDEX tag_siblings_status_index ON tag_siblings ( status );' )

        self._c.execute( 'CREATE TABLE tag_sibling_petitions ( service_id INTEGER REFERENCES services ON DELETE CASCADE, old_namespace_id INTEGER, old_tag_id INTEGER, new_namespace_id INTEGER, new_tag_id INTEGER, status INTEGER, reason_id INTEGER, PRIMARY KEY ( service_id, old_namespace_id, old_tag_id, status ) );' )

        self._c.execute( 'CREATE TABLE urls ( url TEXT PRIMARY KEY, hash_id INTEGER );' )
        self._c.execute( 'CREATE INDEX urls_hash_id ON urls ( hash_id );' )

        self._c.execute( 'CREATE TABLE vacuum_timestamps ( name TEXT, timestamp INTEGER );' )

        self._c.execute( 'CREATE TABLE version ( version INTEGER );' )

        self._c.execute( 'CREATE TABLE web_sessions ( name TEXT PRIMARY KEY, cookies TEXT_YAML, expiry INTEGER );' )

        self._c.execute( 'CREATE TABLE yaml_dumps ( dump_type INTEGER, dump_name TEXT, dump TEXT_YAML, PRIMARY KEY ( dump_type, dump_name ) );' )

        # cache

        self._c.execute( 'CREATE TABLE external_caches.shape_perceptual_hashes ( phash_id INTEGER PRIMARY KEY, phash BLOB_BYTES UNIQUE );' )

        self._c.execute( 'CREATE TABLE external_caches.shape_perceptual_hash_map ( phash_id INTEGER, hash_id INTEGER, PRIMARY KEY ( phash_id, hash_id ) );' )
        self._c.execute( 'CREATE INDEX external_caches.shape_perceptual_hash_map_hash_id_index ON shape_perceptual_hash_map ( hash_id );' )

        self._c.execute( 'CREATE TABLE external_caches.shape_vptree ( phash_id INTEGER PRIMARY KEY, parent_id INTEGER, radius INTEGER, inner_id INTEGER, inner_population INTEGER, outer_id INTEGER, outer_population INTEGER );' )
        self._c.execute( 'CREATE INDEX external_caches.shape_vptree_parent_id_index ON shape_vptree ( parent_id );' )

        self._c.execute( 'CREATE TABLE external_caches.shape_maintenance_phash_regen ( hash_id INTEGER PRIMARY KEY );' )
        self._c.execute( 'CREATE TABLE external_caches.shape_maintenance_branch_regen ( phash_id INTEGER PRIMARY KEY );' )

        self._c.execute( 'CREATE TABLE external_caches.shape_search_cache ( hash_id INTEGER PRIMARY KEY, searched_distance INTEGER );' )

        self._c.execute( 'CREATE TABLE external_caches.duplicate_pairs ( smaller_hash_id INTEGER, larger_hash_id INTEGER, duplicate_type INTEGER, PRIMARY KEY( smaller_hash_id, larger_hash_id ) );' )
        self._c.execute( 'CREATE UNIQUE INDEX external_caches.duplicate_pairs_reversed_hash_ids ON duplicate_pairs ( larger_hash_id, smaller_hash_id );' )

        # master

        self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.hashes ( hash_id INTEGER PRIMARY KEY, hash BLOB_BYTES UNIQUE );' )

        self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.namespaces ( namespace_id INTEGER PRIMARY KEY, namespace TEXT UNIQUE );' )

        self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.tags ( tag_id INTEGER PRIMARY KEY, tag TEXT UNIQUE );' )

        self._c.execute( 'CREATE VIRTUAL TABLE IF NOT EXISTS external_master.tags_fts4 USING fts4( tag );' )

        self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.texts ( text_id INTEGER PRIMARY KEY, text TEXT UNIQUE );' )

        # inserts

        location = HydrusPaths.ConvertAbsPathToPortablePath( client_files_default )

        for prefix in HydrusData.IterateHexPrefixes():

            self._c.execute( 'INSERT INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', ( 'f' + prefix, location ) )
            self._c.execute( 'INSERT INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', ( 't' + prefix, location ) )
            self._c.execute( 'INSERT INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', ( 'r' + prefix, location ) )


        init_service_info = []

        init_service_info.append( ( CC.COMBINED_LOCAL_FILE_SERVICE_KEY, HC.COMBINED_LOCAL_FILE, CC.COMBINED_LOCAL_FILE_SERVICE_KEY ) )
        init_service_info.append( ( CC.LOCAL_FILE_SERVICE_KEY, HC.LOCAL_FILE_DOMAIN, 'my files' ) )
        init_service_info.append( ( CC.TRASH_SERVICE_KEY, HC.LOCAL_FILE_TRASH_DOMAIN, CC.TRASH_SERVICE_KEY ) )
        init_service_info.append( ( CC.LOCAL_TAG_SERVICE_KEY, HC.LOCAL_TAG, CC.LOCAL_TAG_SERVICE_KEY ) )
        init_service_info.append( ( CC.COMBINED_FILE_SERVICE_KEY, HC.COMBINED_FILE, CC.COMBINED_FILE_SERVICE_KEY ) )
        init_service_info.append( ( CC.COMBINED_TAG_SERVICE_KEY, HC.COMBINED_TAG, CC.COMBINED_TAG_SERVICE_KEY ) )
        init_service_info.append( ( CC.LOCAL_BOORU_SERVICE_KEY, HC.LOCAL_BOORU, CC.LOCAL_BOORU_SERVICE_KEY ) )

        self._combined_files_ac_caches = {}

        for ( service_key, service_type, name ) in init_service_info:

            info = {}

            self._AddService( service_key, service_type, name, info )


        self._c.executemany( 'INSERT INTO yaml_dumps VALUES ( ?, ?, ? );', ( ( YAML_DUMP_ID_REMOTE_BOORU, name, booru ) for ( name, booru ) in ClientDefaults.GetDefaultBoorus().items() ) )

        self._c.executemany( 'INSERT INTO yaml_dumps VALUES ( ?, ?, ? );', ( ( YAML_DUMP_ID_IMAGEBOARD, name, imageboards ) for ( name, imageboards ) in ClientDefaults.GetDefaultImageboards() ) )

        new_options = ClientData.ClientOptions( self._db_dir )

        self._SetJSONDump( new_options )

        self._c.execute( 'INSERT INTO namespaces ( namespace_id, namespace ) VALUES ( ?, ? );', ( 1, '' ) )

        self._c.execute( 'INSERT INTO version ( version ) VALUES ( ? );', ( HC.SOFTWARE_VERSION, ) )

        self._c.executemany( 'INSERT INTO json_dumps_named VALUES ( ?, ?, ?, ? );', ClientDefaults.GetDefaultScriptRows() )

        self._c.execute( 'COMMIT;' )


    def _DeleteFiles( self, service_id, hash_ids ):

        splayed_hash_ids = HydrusData.SplayListForDB( hash_ids )

        valid_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( service_id, ) ) }

        if len( valid_hash_ids ) > 0:

            splayed_valid_hash_ids = HydrusData.SplayListForDB( valid_hash_ids )

            # remove them from the service

            self._c.execute( 'DELETE FROM current_files WHERE service_id = ? AND hash_id IN ' + splayed_valid_hash_ids + ';', ( service_id, ) )

            self._c.execute( 'DELETE FROM file_petitions WHERE service_id = ? AND hash_id IN ' + splayed_valid_hash_ids + ';', ( service_id, ) )

            info = self._c.execute( 'SELECT size, mime FROM files_info WHERE hash_id IN ' + splayed_valid_hash_ids + ';' ).fetchall()

            num_files = len( valid_hash_ids )
            delta_size = sum( ( size for ( size, mime ) in info ) )
            num_inbox = len( valid_hash_ids.intersection( self._inbox_hash_ids ) )

            service_info_updates = []

            service_info_updates.append( ( -delta_size, service_id, HC.SERVICE_INFO_TOTAL_SIZE ) )
            service_info_updates.append( ( -num_files, service_id, HC.SERVICE_INFO_NUM_FILES ) )
            service_info_updates.append( ( -num_inbox, service_id, HC.SERVICE_INFO_NUM_INBOX ) )

            # now do special stuff

            service = self._GetService( service_id )

            service_type = service.GetServiceType()

            # record the deleted row if appropriate

            if service_id == self._combined_local_file_service_id or service_type == HC.FILE_REPOSITORY:

                service_info_updates.append( ( num_files, service_id, HC.SERVICE_INFO_NUM_DELETED_FILES ) )

                self._c.executemany( 'INSERT OR IGNORE INTO deleted_files ( service_id, hash_id ) VALUES ( ?, ? );', [ ( service_id, hash_id ) for hash_id in valid_hash_ids ] )


            # if we maintain tag counts for this service, update

            if service_type in HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES:

                tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

                for tag_service_id in tag_service_ids:

                    self._CacheSpecificMappingsDeleteFiles( service_id, tag_service_id, valid_hash_ids )


            # if the files are no longer in any local file services, send them to the trash

            local_file_service_ids = self._GetServiceIds( ( HC.LOCAL_FILE_DOMAIN, ) )

            if service_id in local_file_service_ids:

                splayed_local_file_service_ids = HydrusData.SplayListForDB( local_file_service_ids )

                non_orphan_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE hash_id IN ' + splayed_valid_hash_ids + ' AND service_id IN ' + splayed_local_file_service_ids + ';' ) }

                orphan_hash_ids = valid_hash_ids.difference( non_orphan_hash_ids )

                if len( orphan_hash_ids ) > 0:

                    now = HydrusData.GetNow()

                    delete_rows = [ ( hash_id, now ) for hash_id in orphan_hash_ids ]

                    self._AddFiles( self._trash_service_id, delete_rows )


            # if the files are being fully deleted, then physically delete them

            if service_id == self._combined_local_file_service_id:

                self._DeletePhysicalFiles( valid_hash_ids )


            # push the info updates, notify

            self._c.executemany( 'UPDATE service_info SET info = info + ? WHERE service_id = ? AND info_type = ?;', service_info_updates )

            self.pub_after_commit( 'notify_new_pending' )


        return valid_hash_ids


    def _DeleteHydrusSessionKey( self, service_key ):

        service_id = self._GetServiceId( service_key )

        self._c.execute( 'DELETE FROM hydrus_sessions WHERE service_id = ?;', ( service_id, ) )


    def _DeleteJSONDump( self, dump_type ):

        self._c.execute( 'DELETE FROM json_dumps WHERE dump_type = ?;', ( dump_type, ) )


    def _DeleteJSONDumpNamed( self, dump_type, dump_name = None ):

        if dump_name is None:

            self._c.execute( 'DELETE FROM json_dumps_named WHERE dump_type = ?;', ( dump_type, ) )

        else:

            self._c.execute( 'DELETE FROM json_dumps_named WHERE dump_type = ? AND dump_name = ?;', ( dump_type, dump_name ) )


    def _DeletePending( self, service_key ):

        service_id = self._GetServiceId( service_key )

        service = self._GetService( service_id )

        if service.GetServiceType() == HC.TAG_REPOSITORY:

            ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

            pending_rescinded_mappings_ids = HydrusData.BuildKeyToListDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + pending_mappings_table_name + ';' ) ] )

            pending_rescinded_mappings_ids = [ ( namespace_id, tag_id, hash_ids ) for ( ( namespace_id, tag_id ), hash_ids ) in pending_rescinded_mappings_ids.items() ]

            petitioned_rescinded_mappings_ids = HydrusData.BuildKeyToListDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + petitioned_mappings_table_name + ';' ) ] )

            petitioned_rescinded_mappings_ids = [ ( namespace_id, tag_id, hash_ids ) for ( ( namespace_id, tag_id ), hash_ids ) in petitioned_rescinded_mappings_ids.items() ]

            self._UpdateMappings( service_id, pending_rescinded_mappings_ids = pending_rescinded_mappings_ids, petitioned_rescinded_mappings_ids = petitioned_rescinded_mappings_ids )

            self._c.execute( 'DELETE FROM tag_sibling_petitions WHERE service_id = ?;', ( service_id, ) )
            self._c.execute( 'DELETE FROM tag_parent_petitions WHERE service_id = ?;', ( service_id, ) )

        elif service.GetServiceType() in ( HC.FILE_REPOSITORY, HC.IPFS ):

            self._c.execute( 'DELETE FROM file_transfers WHERE service_id = ?;', ( service_id, ) )
            self._c.execute( 'DELETE FROM file_petitions WHERE service_id = ?;', ( service_id, ) )


        self.pub_after_commit( 'notify_new_pending' )
        self.pub_after_commit( 'notify_new_siblings_data' )
        self.pub_after_commit( 'notify_new_siblings_gui' )
        self.pub_after_commit( 'notify_new_parents' )

        self.pub_service_updates_after_commit( { service_key : [ HydrusData.ServiceUpdate( HC.SERVICE_UPDATE_DELETE_PENDING ) ] } )


    def _DeletePhysicalFiles( self, hash_ids ):

        self._ArchiveFiles( hash_ids )

        hash_ids = set( hash_ids )

        potentially_pending_upload_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM file_transfers;', ) }

        deletable_file_hash_ids = hash_ids.difference( potentially_pending_upload_hash_ids )

        client_files_manager = self._controller.GetClientFilesManager()

        if len( deletable_file_hash_ids ) > 0:

            file_hashes = self._GetHashes( deletable_file_hash_ids )

            self._controller.CallToThread( client_files_manager.DelayedDeleteFiles, file_hashes )


        useful_thumbnail_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';' ) }

        deletable_thumbnail_hash_ids = hash_ids.difference( useful_thumbnail_hash_ids )

        if len( deletable_thumbnail_hash_ids ) > 0:

            thumbnail_hashes = self._GetHashes( deletable_thumbnail_hash_ids )

            self._controller.CallToThread( client_files_manager.DelayedDeleteThumbnails, thumbnail_hashes )


        for hash_id in hash_ids:

            self._CacheSimilarFilesDelete( hash_id )


    def _DeleteService( self, service_id, delete_update_dir = True ):

        service = self._GetService( service_id )

        service_key = service.GetServiceKey()
        service_type = service.GetServiceType()

        self._c.execute( 'DELETE FROM services WHERE service_id = ?;', ( service_id, ) )

        if service_type in HC.TAG_SERVICES:

            ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

            self._c.execute( 'DROP TABLE ' + current_mappings_table_name + ';' )
            self._c.execute( 'DROP TABLE ' + deleted_mappings_table_name + ';' )
            self._c.execute( 'DROP TABLE ' + pending_mappings_table_name + ';' )
            self._c.execute( 'DROP TABLE ' + petitioned_mappings_table_name + ';' )

            #

            self._CacheCombinedFilesMappingsDrop( service_id )

            file_service_ids = self._GetServiceIds( HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES )

            for file_service_id in file_service_ids:

                self._CacheSpecificMappingsDrop( file_service_id, service_id )


        if service_type in HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES:

            tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

            for tag_service_id in tag_service_ids:

                self._CacheSpecificMappingsDrop( service_id, tag_service_id )


        if service_id in self._service_cache:

            del self._service_cache[ service_id ]


        if delete_update_dir:

            update_dir = ClientFiles.GetExpectedUpdateDir( service_key )

            if os.path.exists( update_dir ):

                ClientData.DeletePath( update_dir )


        service_update = HydrusData.ServiceUpdate( HC.SERVICE_UPDATE_RESET )

        service_keys_to_service_updates = { service_key : [ service_update ] }

        self.pub_service_updates_after_commit( service_keys_to_service_updates )


    def _DeleteServiceDirectory( self, service_id, dirname ):

        directory_id = self._GetTextId( dirname )

        self._c.execute( 'DELETE FROM service_directories WHERE service_id = ? AND directory_id = ?;', ( service_id, directory_id ) )
        self._c.execute( 'DELETE FROM service_directory_file_map WHERE service_id = ? AND directory_id = ?;', ( service_id, directory_id ) )


    def _DeleteServiceInfo( self ):

        self._c.execute( 'DELETE FROM service_info;' )

        self.pub_after_commit( 'notify_new_pending' )


    def _DeleteYAMLDump( self, dump_type, dump_name = None ):

        if dump_name is None: self._c.execute( 'DELETE FROM yaml_dumps WHERE dump_type = ?;', ( dump_type, ) )
        else:

            if dump_type == YAML_DUMP_ID_SUBSCRIPTION and dump_name in self._subscriptions_cache: del self._subscriptions_cache[ dump_name ]

            if dump_type == YAML_DUMP_ID_LOCAL_BOORU: dump_name = dump_name.encode( 'hex' )

            self._c.execute( 'DELETE FROM yaml_dumps WHERE dump_type = ? AND dump_name = ?;', ( dump_type, dump_name ) )


        if dump_type == YAML_DUMP_ID_LOCAL_BOORU:

            service_id = self._GetServiceId( CC.LOCAL_BOORU_SERVICE_KEY )

            self._c.execute( 'DELETE FROM service_info WHERE service_id = ? AND info_type = ?;', ( service_id, HC.SERVICE_INFO_NUM_SHARES ) )

            self._controller.pub( 'refresh_local_booru_shares' )


    def _ExportToTagArchive( self, path, service_key, hash_type, hashes = None ):

        # This could nicely take a whitelist or a blacklist for namespace filtering

        prefix_string = 'exporting to tag archive: '

        job_key = ClientThreading.JobKey( cancellable = True )

        job_key.SetVariable( 'popup_text_1', prefix_string + 'preparing' )

        self._controller.pub( 'message', job_key )

        service_id = self._GetServiceId( service_key )

        ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

        hta_exists = os.path.exists( path )

        hta = HydrusTagArchive.HydrusTagArchive( path )

        if hta_exists and hta.GetHashType() != hash_type:

            raise Exception( 'This tag archive does not use the expected hash type, so it cannot be exported to!' )


        if hashes is None:

            include_current = True
            include_pending = False

            hash_ids = self._GetHashIdsThatHaveTags( service_key, include_current, include_pending )

        else:

            hash_ids = self._GetHashIds( hashes )


        hta.BeginBigJob()

        for ( i, hash_id ) in enumerate( hash_ids ):

            ( i_paused, should_quit ) = job_key.WaitIfNeeded()

            if should_quit:

                return


            if i % 100 == 0:

                job_key.SetVariable( 'popup_text_1', prefix_string + HydrusData.ConvertValueRangeToPrettyString( i, len( hash_ids ) ) )
                job_key.SetVariable( 'popup_gauge_1', ( i, len( hash_ids ) ) )


            if hash_type == HydrusTagArchive.HASH_TYPE_SHA256: archive_hash = self._GetHash( hash_id )
            else:

                if hash_type == HydrusTagArchive.HASH_TYPE_MD5: h = 'md5'
                elif hash_type == HydrusTagArchive.HASH_TYPE_SHA1: h = 'sha1'
                elif hash_type == HydrusTagArchive.HASH_TYPE_SHA512: h = 'sha512'

                result = self._c.execute( 'SELECT ' + h + ' FROM local_hashes WHERE hash_id = ?;', ( hash_id, ) ).fetchone()

                if result is None: continue

                ( archive_hash, ) = result


            tags = { HydrusTags.CombineTag( namespace, tag ) for ( namespace, tag ) in self._c.execute( 'SELECT namespace, tag FROM namespaces, ( tags, ' + current_mappings_table_name + ' USING ( tag_id ) ) USING ( namespace_id ) WHERE hash_id = ?;', ( hash_id, ) ) }

            hta.AddMappings( archive_hash, tags )


        job_key.DeleteVariable( 'popup_gauge_1' )
        job_key.SetVariable( 'popup_text_1', prefix_string + 'committing the change and vacuuming the archive' )

        hta.CommitBigJob()

        job_key.SetVariable( 'popup_text_1', prefix_string + 'done!' )

        HydrusData.Print( job_key.ToString() )

        job_key.Finish()


    def _FilterHashes( self, hashes, file_service_key ):

        if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

            return hashes


        service_id = self._GetServiceId( file_service_key )

        hashes_result = []

        for hash in hashes:

            if not self._HashExists( hash ):

                continue


            hash_id = self._GetHashId( hash )

            result = self._c.execute( 'SELECT 1 FROM current_files WHERE service_id = ?;', ( service_id, ) ).fetchone()

            if result is not None:

                hashes_result.append( hash )


        return hashes_result


    def _GetAutocompleteCounts( self, tag_service_id, file_service_id, namespace_id_tag_ids, there_was_a_namespace, add_namespaceless ):

        namespace_ids_to_tag_ids = HydrusData.BuildKeyToListDict( namespace_id_tag_ids )

        if tag_service_id == self._combined_tag_service_id:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ tag_service_id ]


        if file_service_id == self._combined_file_service_id:

            cache_results = self._CacheCombinedFilesMappingsGetAutocompleteCounts( tag_service_id, namespace_ids_to_tag_ids )

        else:

            cache_results = []

            for search_tag_service_id in search_tag_service_ids:

                cache_results.extend( self._CacheSpecificMappingsGetAutocompleteCounts( file_service_id, search_tag_service_id, namespace_ids_to_tag_ids ) )


        #

        ids_to_count = {}

        if not there_was_a_namespace and add_namespaceless:

            added_namespaceless_ids_to_count = {}
            tag_ids_to_incidence_count = collections.Counter()


        def add_count_to_dict( d, key, c_min, c_max, p_min, p_max ):

            if key in d:

                ( current_min, current_max, pending_min, pending_max ) = d[ key ]

                ( current_min, current_max ) = ClientData.MergeCounts( current_min, current_max, c_min, c_max )
                ( pending_min, pending_max ) = ClientData.MergeCounts( pending_min, pending_max, p_min, p_max )

            else:

                ( current_min, current_max, pending_min, pending_max ) = ( c_min, c_max, p_min, p_max )


            d[ key ] = ( current_min, current_max, pending_min, pending_max )


        for ( namespace_id, tag_id, current_count, pending_count ) in cache_results:

            add_count_to_dict( ids_to_count, ( namespace_id, tag_id ), current_count, None, pending_count, None )

            # prepare to add any namespaced counts to the namespaceless count

            if not there_was_a_namespace and add_namespaceless and ( current_count > 0 or pending_count > 0 ):

                tag_ids_to_incidence_count[ tag_id ] += 1

                if namespace_id != 1:

                    add_count_to_dict( added_namespaceless_ids_to_count, tag_id, current_count, None, pending_count, None )


        if not there_was_a_namespace and add_namespaceless:

            for ( tag_id, incidence ) in tag_ids_to_incidence_count.items():

                # any instances of namespaceless counts that are just copies of a single namespaced count are not useful
                # e.g. 'series:evangelion (300)' is not benefitted by adding 'evangelion (300)'
                # so do not add them

                if incidence > 1 and tag_id in added_namespaceless_ids_to_count:

                    ( current_min, current_max, pending_min, pending_max ) = added_namespaceless_ids_to_count[ tag_id ]

                    add_count_to_dict( ids_to_count, ( 1, tag_id ), current_min, current_max, pending_min, pending_max )


        return ids_to_count


    def _GetAutocompleteNamespaceIdTagIds( self, service_key, search_text, exact_match ):

        if exact_match:

            if not self._TagExists( search_text ):

                return set()


            ( namespace_id, tag_id ) = self._GetNamespaceIdTagId( search_text )

            if ':' in search_text:

                predicates_phrase = 'namespace_id = ' + str( namespace_id ) + ' AND tag_id = ' + str( tag_id )

            else:

                predicates_phrase = 'tag_id = ' + str( tag_id )


        else:

            normal_characters = set( 'abcdefghijklmnopqrstuvwxyz0123456789' )

            search_text_can_be_matched = True

            for character in search_text:

                if character not in normal_characters:

                    search_text_can_be_matched = False

                    break


            def GetPossibleTagIds( half_complete_tag ):

                # the issue is that the tokenizer for fts4 doesn't like weird characters
                # a search for '[s' actually only does 's'
                # so, let's do the old and slower LIKE instead of MATCH in weird cases

                # note that queries with '*' are also passed to LIKE, because MATCH only supports appended wildcards 'gun*', and not complex stuff like '*gun*'

                if search_text_can_be_matched:

                    return [ tag_id for ( tag_id, ) in self._c.execute( 'SELECT docid FROM tags_fts4 WHERE tag MATCH ?;', ( '"' + half_complete_tag + '*"', ) ) ]

                else:

                    possible_tag_ids_half_complete_tag = half_complete_tag

                    if '*' in possible_tag_ids_half_complete_tag:

                        possible_tag_ids_half_complete_tag = possible_tag_ids_half_complete_tag.replace( '*', '%' )

                    else:

                        possible_tag_ids_half_complete_tag += '%'


                    return [ tag_id for ( tag_id, ) in self._c.execute( 'SELECT tag_id FROM tags WHERE tag LIKE ? OR tag LIKE ?;', ( possible_tag_ids_half_complete_tag, '% ' + possible_tag_ids_half_complete_tag ) ) ]


            if ':' in search_text:

                ( namespace, half_complete_tag ) = search_text.split( ':', 1 )

                if half_complete_tag == '':

                    return set()

                else:

                    if '*' in namespace:

                        wildcard_namespace = namespace.replace( '*', '%' )

                        possible_namespace_ids = [ namespace_id for ( namespace_id, ) in self._c.execute( 'SELECT namespace_id FROM namespaces WHERE namespace LIKE ?;', ( wildcard_namespace, ) ) ]

                        predicates_phrase_1 = 'namespace_id IN ' + HydrusData.SplayListForDB( possible_namespace_ids )

                    else:

                        result = self._c.execute( 'SELECT namespace_id FROM namespaces WHERE namespace = ?;', ( namespace, ) ).fetchone()

                        if result is None:

                            return set()

                        else:

                            ( namespace_id, ) = result

                            predicates_phrase_1 = 'namespace_id = ' + str( namespace_id )


                    possible_tag_ids = GetPossibleTagIds( half_complete_tag )

                    predicates_phrase = predicates_phrase_1 + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids )


            else:

                possible_tag_ids = GetPossibleTagIds( search_text )

                predicates_phrase = 'tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids )


        namespace_id_tag_ids = { namespace_id_tag_id for namespace_id_tag_id in self._c.execute( 'SELECT namespace_id, tag_id FROM existing_tags WHERE ' + predicates_phrase + ';' ) }

        # now fetch siblings, add to namespace_id_tag_ids set

        siblings_manager = self._controller.GetManager( 'tag_siblings' )

        all_associated_sibling_tags = siblings_manager.GetAutocompleteSiblings( service_key, search_text, exact_match )

        for sibling_tag in all_associated_sibling_tags:

            try: ( namespace_id, tag_id ) = self._GetNamespaceIdTagId( sibling_tag )
            except HydrusExceptions.SizeException: continue

            namespace_id_tag_ids.add( ( namespace_id, tag_id ) )


        return namespace_id_tag_ids


    def _GetAutocompletePredicates( self, tag_service_key = CC.COMBINED_TAG_SERVICE_KEY, file_service_key = CC.COMBINED_FILE_SERVICE_KEY, search_text = '', exact_match = False, inclusive = True, include_current = True, include_pending = True, add_namespaceless = False, collapse_siblings = False ):

        namespace_id_tag_ids = self._GetAutocompleteNamespaceIdTagIds( tag_service_key, search_text, exact_match )

        tag_service_id = self._GetServiceId( tag_service_key )
        file_service_id = self._GetServiceId( file_service_key )

        there_was_a_namespace = ':' in search_text

        if tag_service_id == self._combined_tag_service_id:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ tag_service_id ]


        all_predicates = []

        tag_censorship_manager = self._controller.GetManager( 'tag_censorship' )

        siblings_manager = HydrusGlobals.client_controller.GetManager( 'tag_siblings' )

        for search_tag_service_id in search_tag_service_ids:

            search_tag_service_key = self._GetService( search_tag_service_id ).GetServiceKey()

            ids_to_count = self._GetAutocompleteCounts( search_tag_service_id, file_service_id, namespace_id_tag_ids, there_was_a_namespace, add_namespaceless )

            #

            namespace_id_tag_ids_to_namespace_tags = self._GetNamespaceIdTagIdsToNamespaceTags( ids_to_count.keys() )

            tags_and_counts_generator = ( ( namespace_id_tag_ids_to_namespace_tags[ id ], ids_to_count[ id ] ) for id in ids_to_count.keys() )

            predicates = [ ClientSearch.Predicate( HC.PREDICATE_TYPE_TAG, tag, inclusive, min_current_count = min_current_count, min_pending_count = min_pending_count, max_current_count = max_current_count, max_pending_count = max_pending_count ) for ( tag, ( min_current_count, max_current_count, min_pending_count, max_pending_count ) ) in tags_and_counts_generator ]

            if collapse_siblings:

                predicates = siblings_manager.CollapsePredicates( search_tag_service_key, predicates )


            predicates = tag_censorship_manager.FilterPredicates( search_tag_service_key, predicates )

            all_predicates.extend( predicates )


        predicates = ClientData.MergePredicates( all_predicates )

        return predicates


    def _GetBigTableNamesToAnalyze( self, force_reanalyze = False ):

        db_names = [ name for ( index, name, path ) in self._c.execute( 'PRAGMA database_list;' ) if name not in ( 'mem', 'temp' ) ]

        all_names = set()

        for db_name in db_names:

            all_names.update( ( name for ( name, ) in self._c.execute( 'SELECT name FROM ' + db_name + '.sqlite_master WHERE type = ?;', ( 'table', ) ) ) )


        all_names.discard( 'sqlite_stat1' )

        if force_reanalyze:

            names_to_analyze = list( all_names )

        else:

            # The idea here is that some tables get huge faster than the normal maintenance cycle (usually after syncing to big repo)
            # They then search real slow for like 14 days. And then after that they don't need new analyzes tbh
            # Analyze on a small table takes ~1ms, so let's instead frequently do smaller tables and then catch them and throttle down as they grow

            big_table_minimum = 10000
            huge_table_minimum = 1000000

            small_table_stale_time_delta = 86400
            big_table_stale_time_delta = 30 * 86400
            huge_table_stale_time_delta = 30 * 86400 * 6

            existing_names_to_info = { name : ( num_rows, timestamp ) for ( name, num_rows, timestamp ) in self._c.execute( 'SELECT name, num_rows, timestamp FROM analyze_timestamps;' ) }

            names_to_analyze = []

            for name in all_names:

                if name in existing_names_to_info:

                    ( num_rows, timestamp ) = existing_names_to_info[ name ]

                    if num_rows > big_table_minimum:

                        if num_rows > huge_table_minimum:

                            due_time = timestamp + huge_table_stale_time_delta

                        else:

                            due_time = timestamp + big_table_stale_time_delta


                        if HydrusData.TimeHasPassed( due_time ):

                            names_to_analyze.append( name )


                    else:

                        # these usually take a couple of milliseconds, so just sneak them in here. no need to bother the user with a prompt
                        if HydrusData.TimeHasPassed( timestamp + small_table_stale_time_delta ):

                            self._AnalyzeTable( name )


                else:

                    names_to_analyze.append( name )


        return names_to_analyze


    def _GetClientFilesLocations( self ):

        result = { prefix : HydrusPaths.ConvertPortablePathToAbsPath( location ) for ( prefix, location ) in self._c.execute( 'SELECT prefix, location FROM client_files_locations;' ) }

        return result


    def _GetDownloads( self ):

        return { hash for ( hash, ) in self._c.execute( 'SELECT hash FROM file_transfers, hashes USING ( hash_id ) WHERE service_id = ?;', ( self._combined_local_file_service_id, ) ) }


    def _GetFileHashes( self, given_hashes, given_hash_type, desired_hash_type ):

        if given_hash_type == 'sha256':

            hash_ids = self._GetHashIds( given_hashes )

        else:

            hash_ids = []

            for given_hash in given_hashes:

                if given_hash is None:

                    continue


                result = self._c.execute( 'SELECT hash_id FROM local_hashes WHERE ' + given_hash_type + ' = ?;', ( sqlite3.Binary( given_hash ), ) ).fetchone()

                if result is not None:

                    ( hash_id, ) = result

                    hash_ids.append( hash_id )


        if desired_hash_type == 'sha256':

            desired_hashes = self._GetHashes( hash_ids )

        else:

            desired_hashes = [ desired_hash for ( desired_hash, ) in self._c.execute( 'SELECT ' + desired_hash_type + ' FROM local_hashes WHERE hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';' ) ]


        return desired_hashes


    def _GetFileSystemPredicates( self, service_key ):

        service_id = self._GetServiceId( service_key )

        service = self._GetService( service_id )

        service_type = service.GetServiceType()

        predicates = []

        if service_type in ( HC.COMBINED_FILE, HC.COMBINED_TAG ):

            predicates.extend( [ ClientSearch.Predicate( predicate_type, None ) for predicate_type in [ HC.PREDICATE_TYPE_SYSTEM_EVERYTHING, HC.PREDICATE_TYPE_SYSTEM_UNTAGGED, HC.PREDICATE_TYPE_SYSTEM_NUM_TAGS, HC.PREDICATE_TYPE_SYSTEM_LIMIT, HC.PREDICATE_TYPE_SYSTEM_HASH ] ] )

        elif service_type in HC.TAG_SERVICES:

            service_info = self._GetServiceInfoSpecific( service_id, service_type, { HC.SERVICE_INFO_NUM_FILES } )

            num_everything = service_info[ HC.SERVICE_INFO_NUM_FILES ]

            predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_EVERYTHING, min_current_count = num_everything ) )

            predicates.extend( [ ClientSearch.Predicate( predicate_type, None ) for predicate_type in [ HC.PREDICATE_TYPE_SYSTEM_UNTAGGED, HC.PREDICATE_TYPE_SYSTEM_NUM_TAGS, HC.PREDICATE_TYPE_SYSTEM_LIMIT, HC.PREDICATE_TYPE_SYSTEM_HASH ] ] )

        elif service_type in HC.FILE_SERVICES:

            service_info = self._GetServiceInfoSpecific( service_id, service_type, { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_NUM_INBOX } )

            num_everything = service_info[ HC.SERVICE_INFO_NUM_FILES ]
            num_inbox = service_info[ HC.SERVICE_INFO_NUM_INBOX ]
            num_archive = num_everything - num_inbox

            if service_type == HC.FILE_REPOSITORY:

                ( num_local, ) = self._c.execute( 'SELECT COUNT( * ) FROM current_files AS remote_current_files, current_files USING ( hash_id ) WHERE remote_current_files.service_id = ? AND current_files.service_id = ?;', ( service_id, self._combined_local_file_service_id ) ).fetchone()

                num_not_local = num_everything - num_local

                num_archive = num_local - num_inbox


            predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_EVERYTHING, min_current_count = num_everything ) )

            show_inbox_and_archive = True

            new_options = self._controller.GetNewOptions()

            if new_options.GetBoolean( 'filter_inbox_and_archive_predicates' ) and ( num_inbox == 0 or num_archive == 0 ):

                show_inbox_and_archive = False


            if show_inbox_and_archive:

                predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_INBOX, min_current_count = num_inbox ) )
                predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_ARCHIVE, min_current_count = num_archive ) )


            if service_type == HC.FILE_REPOSITORY:

                predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_LOCAL, min_current_count = num_local ) )
                predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_NOT_LOCAL, min_current_count = num_not_local ) )


            predicates.extend( [ ClientSearch.Predicate( predicate_type ) for predicate_type in [ HC.PREDICATE_TYPE_SYSTEM_UNTAGGED, HC.PREDICATE_TYPE_SYSTEM_NUM_TAGS, HC.PREDICATE_TYPE_SYSTEM_LIMIT, HC.PREDICATE_TYPE_SYSTEM_SIZE, HC.PREDICATE_TYPE_SYSTEM_AGE, HC.PREDICATE_TYPE_SYSTEM_HASH, HC.PREDICATE_TYPE_SYSTEM_DIMENSIONS, HC.PREDICATE_TYPE_SYSTEM_DURATION, HC.PREDICATE_TYPE_SYSTEM_NUM_WORDS, HC.PREDICATE_TYPE_SYSTEM_MIME ] ] )

            ratings_service_ids = self._GetServiceIds( HC.RATINGS_SERVICES )

            if len( ratings_service_ids ) > 0: predicates.append( ClientSearch.Predicate( HC.PREDICATE_TYPE_SYSTEM_RATING ) )

            predicates.extend( [ ClientSearch.Predicate( predicate_type ) for predicate_type in [ HC.PREDICATE_TYPE_SYSTEM_SIMILAR_TO, HC.PREDICATE_TYPE_SYSTEM_FILE_SERVICE ] ] )


        return predicates


    def _GetHash( self, hash_id ):

        result = self._c.execute( 'SELECT hash FROM hashes WHERE hash_id = ?;', ( hash_id, ) ).fetchone()

        if result is None:

            raise HydrusExceptions.DataMissing( 'File hash error in database' )


        ( hash, ) = result

        return hash


    def _GetHashes( self, hash_ids ): return [ hash for ( hash, ) in self._c.execute( 'SELECT hash FROM hashes WHERE hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';' ) ]

    def _GetHashId( self, hash ):

        result = self._c.execute( 'SELECT hash_id FROM hashes WHERE hash = ?;', ( sqlite3.Binary( hash ), ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO hashes ( hash ) VALUES ( ? );', ( sqlite3.Binary( hash ), ) )

            hash_id = self._c.lastrowid

        else: ( hash_id, ) = result

        return hash_id


    def _GetHashIds( self, hashes ):

        hash_ids = set()
        hashes_not_in_db = set()

        for hash in hashes:

            if hash is None:

                continue


            result = self._c.execute( 'SELECT hash_id FROM hashes WHERE hash = ?;', ( sqlite3.Binary( hash ), ) ).fetchone()

            if result is None:

                hashes_not_in_db.add( hash )

            else:

                ( hash_id, ) = result

                hash_ids.add( hash_id )


        if len( hashes_not_in_db ) > 0:

            self._c.executemany( 'INSERT INTO hashes ( hash ) VALUES( ? );', ( ( sqlite3.Binary( hash ), ) for hash in hashes_not_in_db ) )

            for hash in hashes_not_in_db:

                ( hash_id, ) = self._c.execute( 'SELECT hash_id FROM hashes WHERE hash = ?;', ( sqlite3.Binary( hash ), ) ).fetchone()

                hash_ids.add( hash_id )


        return hash_ids


    def _GetHashIdsFromNamespace( self, file_service_key, tag_service_key, namespace, include_current_tags, include_pending_tags ):

        file_service_id = self._GetServiceId( file_service_key )
        tag_service_id = self._GetServiceId( tag_service_key )
        namespace_id = self._GetNamespaceId( namespace )

        current_selects = []
        pending_selects = []

        if tag_service_key == CC.COMBINED_TAG_SERVICE_KEY:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ tag_service_id ]


        for search_tag_service_id in search_tag_service_ids:

            ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

            if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE namespace_id = ' + str( namespace_id ) + ';' )
                pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ' WHERE namespace_id = ' + str( namespace_id ) + ';' )

            else:

                current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND namespace_id = ' + str( namespace_id ) + ';' )
                pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND namespace_id = ' + str( namespace_id ) + ';' )


        hash_ids = set()

        if include_current_tags:

            for current_select in current_selects:

                hash_ids.update( ( id for ( id, ) in self._c.execute( current_select ) ) )


        if include_pending_tags:

            for pending_select in pending_selects:

                hash_ids.update( ( id for ( id, ) in self._c.execute( pending_select ) ) )


        return hash_ids


    def _GetHashIdsFromQuery( self, search_context ):

        self._controller.ResetIdleTimer()

        system_predicates = search_context.GetSystemPredicates()

        file_service_key = search_context.GetFileServiceKey()
        tag_service_key = search_context.GetTagServiceKey()

        file_service_id = self._GetServiceId( file_service_key )
        tag_service_id = self._GetServiceId( tag_service_key )

        file_service = self._GetService( file_service_id )
        tag_service = self._GetService( tag_service_id )

        file_service_type = file_service.GetServiceType()
        tag_service_type = tag_service.GetServiceType()

        tags_to_include = search_context.GetTagsToInclude()
        tags_to_exclude = search_context.GetTagsToExclude()

        namespaces_to_include = search_context.GetNamespacesToInclude()
        namespaces_to_exclude = search_context.GetNamespacesToExclude()

        wildcards_to_include = search_context.GetWildcardsToInclude()
        wildcards_to_exclude = search_context.GetWildcardsToExclude()

        include_current_tags = search_context.IncludeCurrentTags()
        include_pending_tags = search_context.IncludePendingTags()

        #

        files_info_predicates = []

        simple_preds = system_predicates.GetSimpleInfo()

        # This now overrides any other predicates, including file domain

        if 'hash' in simple_preds:

            query_hash_ids = set()

            ( search_hash, search_hash_type ) = simple_preds[ 'hash' ]

            if search_hash_type != 'sha256':

                result = self._GetFileHashes( [ search_hash ], search_hash_type, 'sha256' )

                if len( result ) > 0:

                    ( search_hash, ) = result

                    hash_id = self._GetHashId( search_hash )

                    query_hash_ids = { hash_id }


            else:

                if self._HashExists( search_hash ):

                    hash_id = self._GetHashId( search_hash )

                    query_hash_ids = { hash_id }


            return query_hash_ids


        if 'min_size' in simple_preds: files_info_predicates.append( 'size > ' + str( simple_preds[ 'min_size' ] ) )
        if 'size' in simple_preds: files_info_predicates.append( 'size = ' + str( simple_preds[ 'size' ] ) )
        if 'max_size' in simple_preds: files_info_predicates.append( 'size < ' + str( simple_preds[ 'max_size' ] ) )

        if 'mimes' in simple_preds:

            mimes = simple_preds[ 'mimes' ]

            if len( mimes ) == 1:

                ( mime, ) = mimes

                files_info_predicates.append( 'mime = ' + str( mime ) )

            else: files_info_predicates.append( 'mime IN ' + HydrusData.SplayListForDB( mimes ) )


        if file_service_key != CC.COMBINED_FILE_SERVICE_KEY:

            if 'min_timestamp' in simple_preds: files_info_predicates.append( 'timestamp >= ' + str( simple_preds[ 'min_timestamp' ] ) )
            if 'max_timestamp' in simple_preds: files_info_predicates.append( 'timestamp <= ' + str( simple_preds[ 'max_timestamp' ] ) )


        if 'min_width' in simple_preds: files_info_predicates.append( 'width > ' + str( simple_preds[ 'min_width' ] ) )
        if 'width' in simple_preds: files_info_predicates.append( 'width = ' + str( simple_preds[ 'width' ] ) )
        if 'max_width' in simple_preds: files_info_predicates.append( 'width < ' + str( simple_preds[ 'max_width' ] ) )

        if 'min_height' in simple_preds: files_info_predicates.append( 'height > ' + str( simple_preds[ 'min_height' ] ) )
        if 'height' in simple_preds: files_info_predicates.append( 'height = ' + str( simple_preds[ 'height' ] ) )
        if 'max_height' in simple_preds: files_info_predicates.append( 'height < ' + str( simple_preds[ 'max_height' ] ) )

        if 'min_num_pixels' in simple_preds: files_info_predicates.append( 'width * height > ' + str( simple_preds[ 'min_num_pixels' ] ) )
        if 'num_pixels' in simple_preds: files_info_predicates.append( 'width * height = ' + str( simple_preds[ 'num_pixels' ] ) )
        if 'max_num_pixels' in simple_preds: files_info_predicates.append( 'width * height < ' + str( simple_preds[ 'max_num_pixels' ] ) )

        if 'min_ratio' in simple_preds:

            ( ratio_width, ratio_height ) = simple_preds[ 'min_ratio' ]

            files_info_predicates.append( '( width * 1.0 ) / height > ' + str( float( ratio_width ) ) + ' / ' + str( ratio_height ) )

        if 'ratio' in simple_preds:

            ( ratio_width, ratio_height ) = simple_preds[ 'ratio' ]

            files_info_predicates.append( '( width * 1.0 ) / height = ' + str( float( ratio_width ) ) + ' / ' + str( ratio_height ) )

        if 'max_ratio' in simple_preds:

            ( ratio_width, ratio_height ) = simple_preds[ 'max_ratio' ]

            files_info_predicates.append( '( width * 1.0 ) / height < ' + str( float( ratio_width ) ) + ' / ' + str( ratio_height ) )


        if 'min_num_words' in simple_preds: files_info_predicates.append( 'num_words > ' + str( simple_preds[ 'min_num_words' ] ) )
        if 'num_words' in simple_preds:

            num_words = simple_preds[ 'num_words' ]

            if num_words == 0: files_info_predicates.append( '( num_words IS NULL OR num_words = 0 )' )
            else: files_info_predicates.append( 'num_words = ' + str( num_words ) )

        if 'max_num_words' in simple_preds:

            max_num_words = simple_preds[ 'max_num_words' ]

            if max_num_words == 0: files_info_predicates.append( 'num_words < ' + str( max_num_words ) )
            else: files_info_predicates.append( '( num_words < ' + str( max_num_words ) + ' OR num_words IS NULL )' )


        if 'min_duration' in simple_preds: files_info_predicates.append( 'duration > ' + str( simple_preds[ 'min_duration' ] ) )
        if 'duration' in simple_preds:

            duration = simple_preds[ 'duration' ]

            if duration == 0: files_info_predicates.append( '( duration IS NULL OR duration = 0 )' )
            else: files_info_predicates.append( 'duration = ' + str( duration ) )

        if 'max_duration' in simple_preds:

            max_duration = simple_preds[ 'max_duration' ]

            if max_duration == 0: files_info_predicates.append( 'duration < ' + str( max_duration ) )
            else: files_info_predicates.append( '( duration < ' + str( max_duration ) + ' OR duration IS NULL )' )


        if len( tags_to_include ) > 0 or len( namespaces_to_include ) > 0 or len( wildcards_to_include ) > 0:

            query_hash_ids = None

            if len( tags_to_include ) > 0:

                query_hash_ids = HydrusData.IntelligentMassIntersect( ( self._GetHashIdsFromTag( file_service_key, tag_service_key, tag, include_current_tags, include_pending_tags ) for tag in tags_to_include ) )


            if len( namespaces_to_include ) > 0:

                namespace_query_hash_ids = HydrusData.IntelligentMassIntersect( ( self._GetHashIdsFromNamespace( file_service_key, tag_service_key, namespace, include_current_tags, include_pending_tags ) for namespace in namespaces_to_include ) )

                if query_hash_ids is None: query_hash_ids = namespace_query_hash_ids
                else: query_hash_ids.intersection_update( namespace_query_hash_ids )


            if len( wildcards_to_include ) > 0:

                wildcard_query_hash_ids = HydrusData.IntelligentMassIntersect( ( self._GetHashIdsFromWildcard( file_service_key, tag_service_key, wildcard, include_current_tags, include_pending_tags ) for wildcard in wildcards_to_include ) )

                if query_hash_ids is None: query_hash_ids = wildcard_query_hash_ids
                else: query_hash_ids.intersection_update( wildcard_query_hash_ids )


            if len( files_info_predicates ) > 0:

                if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                    query_hash_ids.intersection_update( [ id for ( id, ) in self._c.execute( 'SELECT hash_id FROM files_info WHERE ' + ' AND '.join( files_info_predicates ) + ';' ) ] )

                else:

                    files_info_predicates.insert( 0, 'service_id = ' + str( file_service_id ) )

                    query_hash_ids.intersection_update( [ id for ( id, ) in self._c.execute( 'SELECT hash_id FROM current_files, files_info USING ( hash_id ) WHERE ' + ' AND '.join( files_info_predicates ) + ';' ) ] )


        else:

            if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                query_hash_ids = self._GetHashIdsThatHaveTags( tag_service_key, include_current_tags, include_pending_tags )

            else:

                files_info_predicates.insert( 0, 'service_id = ' + str( file_service_id ) )

                query_hash_ids = { id for ( id, ) in self._c.execute( 'SELECT hash_id FROM current_files, files_info USING ( hash_id ) WHERE ' + ' AND '.join( files_info_predicates ) + ';' ) }


        #

        if system_predicates.HasSimilarTo():

            ( similar_to_hash, max_hamming ) = system_predicates.GetSimilarTo()

            hash_id = self._GetHashId( similar_to_hash )

            similar_hash_ids = self._CacheSimilarFilesSearch( hash_id, max_hamming )

            query_hash_ids.intersection_update( similar_hash_ids )


        #

        exclude_query_hash_ids = set()

        for tag in tags_to_exclude: exclude_query_hash_ids.update( self._GetHashIdsFromTag( file_service_key, tag_service_key, tag, include_current_tags, include_pending_tags ) )

        for namespace in namespaces_to_exclude: exclude_query_hash_ids.update( self._GetHashIdsFromNamespace( file_service_key, tag_service_key, namespace, include_current_tags, include_pending_tags ) )

        for wildcard in wildcards_to_exclude: exclude_query_hash_ids.update( self._GetHashIdsFromWildcard( file_service_key, tag_service_key, wildcard, include_current_tags, include_pending_tags ) )

        query_hash_ids.difference_update( exclude_query_hash_ids )

        #

        ( file_services_to_include_current, file_services_to_include_pending, file_services_to_exclude_current, file_services_to_exclude_pending ) = system_predicates.GetFileServiceInfo()

        for service_key in file_services_to_include_current:

            service_id = self._GetServiceId( service_key )

            query_hash_ids.intersection_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?;', ( service_id, ) ) ] )


        for service_key in file_services_to_include_pending:

            service_id = self._GetServiceId( service_key )

            query_hash_ids.intersection_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM file_transfers WHERE service_id = ?;', ( service_id, ) ) ] )


        for service_key in file_services_to_exclude_current:

            service_id = self._GetServiceId( service_key )

            query_hash_ids.difference_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?;', ( service_id, ) ) ] )


        for service_key in file_services_to_exclude_pending:

            service_id = self._GetServiceId( service_key )

            query_hash_ids.difference_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM file_transfers WHERE service_id = ?;', ( service_id, ) ) ] )


        for ( operator, value, service_key ) in system_predicates.GetRatingsPredicates():

            service_id = self._GetServiceId( service_key )

            if value == 'rated': query_hash_ids.intersection_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM local_ratings WHERE service_id = ?;', ( service_id, ) ) ] )
            elif value == 'not rated': query_hash_ids.difference_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM local_ratings WHERE service_id = ?;', ( service_id, ) ) ] )
            else:

                if operator == u'\u2248': predicate = str( value * 0.95 ) + ' < rating AND rating < ' + str( value * 1.05 )
                else: predicate = 'rating ' + operator + ' ' + str( value )

                query_hash_ids.intersection_update( [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM local_ratings WHERE service_id = ? AND ' + predicate + ';', ( service_id, ) ) ] )


        #

        must_be_local = system_predicates.MustBeLocal() or system_predicates.MustBeArchive()
        must_not_be_local = system_predicates.MustNotBeLocal()
        must_be_inbox = system_predicates.MustBeInbox()
        must_be_archive = system_predicates.MustBeArchive()

        if file_service_type in HC.LOCAL_FILE_SERVICES:

            if must_not_be_local:

                query_hash_ids = set()


        elif must_be_local or must_not_be_local:

            local_hash_ids = [ id for ( id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?;', ( self._combined_local_file_service_id, ) ) ]

            if must_be_local:

                query_hash_ids.intersection_update( local_hash_ids )

            elif must_not_be_local:

                query_hash_ids.difference_update( local_hash_ids )


        if must_be_inbox:

            query_hash_ids.intersection_update( self._inbox_hash_ids )

        elif must_be_archive:

            query_hash_ids.difference_update( self._inbox_hash_ids )


        #

        num_tags_zero = False
        num_tags_nonzero = False
        max_num_tags_exists = False

        tag_predicates = []

        if 'min_num_tags' in simple_preds:

            min_num_tags = simple_preds[ 'min_num_tags' ]

            if min_num_tags == 0:

                num_tags_nonzero = True

            else:

                tag_predicates.append( lambda x: x > min_num_tags )


        if 'num_tags' in simple_preds:

            num_tags = simple_preds[ 'num_tags' ]

            if num_tags == 0:

                num_tags_zero = True

            else:

                tag_predicates.append( lambda x: x == num_tags )


        if 'max_num_tags' in simple_preds:

            max_num_tags = simple_preds[ 'max_num_tags' ]

            if max_num_tags == 1:

                num_tags_zero = True

            else:

                tag_predicates.append( lambda x: x < max_num_tags )


        tag_predicates_care_about_zero_counts = len( tag_predicates ) > 0 and False not in ( pred( 0 ) for pred in tag_predicates )

        if num_tags_zero or num_tags_nonzero or tag_predicates_care_about_zero_counts:

            nonzero_tag_query_hash_ids = self._GetHashIdsThatHaveTags( tag_service_key, include_current_tags, include_pending_tags, query_hash_ids )

            if num_tags_zero:

                query_hash_ids.difference_update( nonzero_tag_query_hash_ids )

            elif num_tags_nonzero:

                query_hash_ids.intersection_update( nonzero_tag_query_hash_ids )


        if len( tag_predicates ) > 0:

            hash_id_tag_counts = self._GetHashIdsTagCounts( tag_service_key, include_current_tags, include_pending_tags, query_hash_ids )

            good_tag_count_hash_ids = { id for ( id, count ) in hash_id_tag_counts if False not in ( pred( count ) for pred in tag_predicates ) }

            if tag_predicates_care_about_zero_counts:

                zero_hash_ids = query_hash_ids.difference( nonzero_tag_query_hash_ids )

                good_tag_count_hash_ids.update( zero_hash_ids )


            query_hash_ids.intersection_update( good_tag_count_hash_ids )


        #

        limit = system_predicates.GetLimit()

        if limit is not None and limit <= len( query_hash_ids ):

            query_hash_ids = random.sample( query_hash_ids, limit )

        else:

            query_hash_ids = list( query_hash_ids )


        return query_hash_ids


    def _GetHashIdsFromTag( self, file_service_key, tag_service_key, tag, include_current_tags, include_pending_tags ):

        siblings_manager = self._controller.GetManager( 'tag_siblings' )

        tags = siblings_manager.GetAllSiblings( tag_service_key, tag )

        file_service_id = self._GetServiceId( file_service_key )

        if tag_service_key == CC.COMBINED_TAG_SERVICE_KEY:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ self._GetServiceId( tag_service_key ) ]


        hash_ids = set()

        for tag in tags:

            if not self._TagExists( tag ):

                continue


            current_selects = []
            pending_selects = []

            try: ( namespace_id, tag_id ) = self._GetNamespaceIdTagId( tag )
            except HydrusExceptions.SizeException: continue

            if ':' in tag:

                for search_tag_service_id in search_tag_service_ids:

                    ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                    if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                        current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE namespace_id = ' + str( namespace_id ) + ' AND tag_id = ' + str( tag_id ) + ';' )
                        pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ' WHERE namespace_id = ' + str( namespace_id ) + ' AND tag_id = ' + str( tag_id ) + ';' )

                    else:

                        current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND namespace_id = ' + str( namespace_id ) + ' AND tag_id = ' + str( tag_id ) + ';' )
                        pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND namespace_id = ' + str( namespace_id ) + ' AND tag_id = ' + str( tag_id ) + ';' )


            else:

                for search_tag_service_id in search_tag_service_ids:

                    ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                    if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                        current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE tag_id = ' + str( tag_id ) + ';' )
                        pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ' WHERE tag_id = ' + str( tag_id ) + ';' )

                    else:

                        current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND tag_id = ' + str( tag_id ) + ';' )
                        pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND tag_id = ' + str( tag_id ) + ';' )


            if include_current_tags:

                for current_select in current_selects:

                    hash_ids.update( ( id for ( id, ) in self._c.execute( current_select ) ) )


            if include_pending_tags:

                for pending_select in pending_selects:

                    hash_ids.update( ( id for ( id, ) in self._c.execute( pending_select ) ) )


        return hash_ids


    def _GetHashIdsFromWildcard( self, file_service_key, tag_service_key, wildcard, include_current_tags, include_pending_tags ):

        def GetNamespaceIdsFromWildcard( w ):

            if '*' in w:

                w = w.replace( '*', '%' )

                return { namespace_id for ( namespace_id, ) in self._c.execute( 'SELECT namespace_id FROM namespaces WHERE namespace LIKE ?;', ( w, ) ) }

            else:

                namespace_id = self._GetNamespaceId( w )

                return [ namespace_id ]


        def GetTagIdsFromWildcard( w ):

            if '*' in w:

                w = w.replace( '*', '%' )

                return { tag_id for ( tag_id, ) in self._c.execute( 'SELECT tag_id FROM tags WHERE tag LIKE ? or tag LIKE ?;', ( w, '% ' + w ) ) }

            else:

                ( namespace_id, tag_id ) = self._GetNamespaceIdTagId( w )

                return [ tag_id ]


        file_service_id = self._GetServiceId( file_service_key )

        if tag_service_key == CC.COMBINED_TAG_SERVICE_KEY:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ self._GetServiceId( tag_service_key ) ]


        current_selects = []
        pending_selects = []

        if ':' in wildcard:

            ( namespace_wildcard, tag_wildcard ) = wildcard.split( ':', 1 )

            possible_namespace_ids = GetNamespaceIdsFromWildcard( namespace_wildcard )
            possible_tag_ids = GetTagIdsFromWildcard( tag_wildcard )

            for search_tag_service_id in search_tag_service_ids:

                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                    current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE namespace_id IN ' + HydrusData.SplayListForDB( possible_namespace_ids ) + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )
                    pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ' WHERE namespace_id IN ' + HydrusData.SplayListForDB( possible_namespace_ids ) + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )

                else:

                    current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND namespace_id IN ' + HydrusData.SplayListForDB( possible_namespace_ids ) + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )
                    pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND namespace_id IN ' + HydrusData.SplayListForDB( possible_namespace_ids ) + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )


        else:

            possible_tag_ids = GetTagIdsFromWildcard( wildcard )

            for search_tag_service_id in search_tag_service_ids:

                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                if file_service_key == CC.COMBINED_FILE_SERVICE_KEY:

                    current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )
                    pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ' WHERE tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )

                else:

                    current_selects.append( 'SELECT hash_id FROM ' + current_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )
                    pending_selects.append( 'SELECT hash_id FROM ' + pending_mappings_table_name + ', current_files USING ( hash_id ) WHERE current_files.service_id = ' + str( file_service_id ) + ' AND tag_id IN ' + HydrusData.SplayListForDB( possible_tag_ids ) + ';' )


        hash_ids = set()

        if include_current_tags:

            for current_select in current_selects:

                hash_ids.update( ( id for ( id, ) in self._c.execute( current_select ) ) )


        if include_pending_tags:

            for pending_select in pending_selects:

                hash_ids.update( ( id for ( id, ) in self._c.execute( pending_select ) ) )


        return hash_ids


    def _GetHashIdsTagCounts( self, tag_service_key, include_current, include_pending, hash_ids = None ):

        if tag_service_key == CC.COMBINED_TAG_SERVICE_KEY:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ self._GetServiceId( tag_service_key ) ]


        tags_counter = collections.Counter()

        if hash_ids is None:

            for search_tag_service_id in search_tag_service_ids:

                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                if include_current:

                    for ( id, count ) in self._c.execute( 'SELECT hash_id, COUNT( DISTINCT tag_id ) FROM ' + current_mappings_table_name + ' GROUP BY hash_id, namespace_id;' ):

                        tags_counter[ id ] += count


                if include_pending:

                    for ( id, count ) in self._c.execute( 'SELECT hash_id, COUNT( DISTINCT tag_id ) FROM ' + pending_mappings_table_name + ' GROUP BY hash_id, namespace_id;' ):

                        tags_counter[ id ] += count


        else:

            with HydrusDB.TemporaryIntegerTable( self._c, hash_ids, 'hash_id' ) as temp_table_name:

                for search_tag_service_id in search_tag_service_ids:

                    ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                    if include_current:

                        for ( id, count ) in self._c.execute( 'SELECT hash_id, COUNT( DISTINCT tag_id ) FROM ' + temp_table_name + ',' + current_mappings_table_name + ' USING ( hash_id ) GROUP BY hash_id, namespace_id;' ):

                            tags_counter[ id ] += count


                    if include_pending:

                        for ( id, count ) in self._c.execute( 'SELECT hash_id, COUNT( DISTINCT tag_id ) FROM ' + temp_table_name + ',' + pending_mappings_table_name + ' USING ( hash_id ) GROUP BY hash_id, namespace_id;' ):

                            tags_counter[ id ] += count


        return tags_counter.items()


    def _GetHashIdsThatHaveTags( self, tag_service_key, include_current, include_pending, hash_ids = None ):

        if tag_service_key == CC.COMBINED_TAG_SERVICE_KEY:

            search_tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

        else:

            search_tag_service_ids = [ self._GetServiceId( tag_service_key ) ]


        nonzero_tag_hash_ids = set()

        if hash_ids is None:

            for search_tag_service_id in search_tag_service_ids:

                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )
                '''
                if include_current and include_pending:

                    nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT hash_id as h FROM hashes WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE hash_id = h ) OR EXISTS ( SELECT 1 FROM ' + pending_mappings_table_name + ' WHERE hash_id = h );' ) ) )

                elif include_current:

                    nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT hash_id as h FROM hashes WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE hash_id = h );' ) ) )

                elif include_pending:

                    nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT hash_id as h FROM hashes WHERE EXISTS ( SELECT 1 FROM ' + pending_mappings_table_name + ' WHERE hash_id = h );' ) ) )

                '''

                if include_current:

                    nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT DISTINCT hash_id FROM ' + current_mappings_table_name + ';' ) ) )


                if include_pending:

                    nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT DISTINCT hash_id FROM ' + pending_mappings_table_name + ';' ) ) )


        else:

            with HydrusDB.TemporaryIntegerTable( self._c, hash_ids, 'hash_id' ) as temp_table_name:

                for search_tag_service_id in search_tag_service_ids:

                    ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( search_tag_service_id )

                    if include_current and include_pending:

                        nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT hash_id as h FROM ' + temp_table_name + ' WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE hash_id = h ) OR EXISTS ( SELECT 1 FROM ' + pending_mappings_table_name + ' WHERE hash_id = h );' ) ) )

                    elif include_current:

                        nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT hash_id as h FROM ' + temp_table_name + ' WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE hash_id = h );' ) ) )

                    elif include_pending:

                        nonzero_tag_hash_ids.update( ( id for ( id, ) in self._c.execute( 'SELECT hash_id as h FROM ' + temp_table_name + ' WHERE EXISTS ( SELECT 1 FROM ' + pending_mappings_table_name + ' WHERE hash_id = h );' ) ) )


        return nonzero_tag_hash_ids


    def _GetHashIdsToHashes( self, hash_ids ):

        # this is actually a bit faster than saying "hash_id IN ( bigass_list )"

        results = {}

        for hash_id in hash_ids:

            ( hash, ) = self._c.execute( 'SELECT hash FROM hashes WHERE hash_id = ?;', ( hash_id, ) ).fetchone()

            results[ hash_id ] = hash


        return results


    def _GetHashIdStatus( self, hash_id ):

        result = self._c.execute( 'SELECT 1 FROM deleted_files WHERE service_id = ? AND hash_id = ?;', ( self._combined_local_file_service_id, hash_id ) ).fetchone()

        if result is not None:

            return ( CC.STATUS_DELETED, None )


        result = self._c.execute( 'SELECT 1 FROM current_files WHERE service_id = ? AND hash_id = ?;', ( self._trash_service_id, hash_id ) ).fetchone()

        if result is not None:

            return ( CC.STATUS_DELETED, None )


        result = self._c.execute( 'SELECT 1 FROM current_files WHERE service_id = ? AND hash_id = ?;', ( self._combined_local_file_service_id, hash_id ) ).fetchone()

        if result is not None:

            hash = self._GetHash( hash_id )

            return ( CC.STATUS_REDUNDANT, hash )


        return ( CC.STATUS_NEW, None )


    def _GetHydrusSessions( self ):

        now = HydrusData.GetNow()

        self._c.execute( 'DELETE FROM hydrus_sessions WHERE ? > expiry;', ( now, ) )

        sessions = []

        results = self._c.execute( 'SELECT service_id, session_key, expiry FROM hydrus_sessions;' ).fetchall()

        for ( service_id, session_key, expires ) in results:

            service = self._GetService( service_id )

            service_key = service.GetServiceKey()

            sessions.append( ( service_key, session_key, expires ) )


        return sessions


    def _GetJSONDump( self, dump_type ):

        ( version, dump ) = self._c.execute( 'SELECT version, dump FROM json_dumps WHERE dump_type = ?;', ( dump_type, ) ).fetchone()

        serialisable_info = json.loads( dump )

        return HydrusSerialisable.CreateFromSerialisableTuple( ( dump_type, version, serialisable_info ) )


    def _GetJSONDumpNamed( self, dump_type, dump_name = None ):

        if dump_name is None:

            results = self._c.execute( 'SELECT dump_name, version, dump FROM json_dumps_named WHERE dump_type = ?;', ( dump_type, ) ).fetchall()

            objs = []

            for ( dump_name, version, dump ) in results:

                serialisable_info = json.loads( dump )

                objs.append( HydrusSerialisable.CreateFromSerialisableTuple( ( dump_type, dump_name, version, serialisable_info ) ) )


            return objs

        else:

            ( version, dump ) = self._c.execute( 'SELECT version, dump FROM json_dumps_named WHERE dump_type = ? AND dump_name = ?;', ( dump_type, dump_name ) ).fetchone()

            serialisable_info = json.loads( dump )

            return HydrusSerialisable.CreateFromSerialisableTuple( ( dump_type, dump_name, version, serialisable_info ) )


    def _GetJSONDumpNames( self, dump_type ):

        names = [ name for ( name, ) in self._c.execute( 'SELECT dump_name FROM json_dumps_named WHERE dump_type = ?;', ( dump_type, ) ) ]

        return names


    def _GetJSONSimple( self, name ):

        result = self._c.execute( 'SELECT dump FROM json_dict WHERE name = ?;', ( name, ) ).fetchone()

        if result is None:

            return None


        ( json_dump, ) = result

        value = json.loads( json_dump )

        return value


    def _GetKnownURLs( self, hash ):

        hash_id = self._GetHashId( hash )

        urls = [ url for ( url, ) in self._c.execute( 'SELECT url FROM urls WHERE hash_id = ?;', ( hash_id, ) ) ]

        return urls


    def _GetMD5Status( self, md5 ):

        result = self._c.execute( 'SELECT hash_id FROM local_hashes WHERE md5 = ?;', ( sqlite3.Binary( md5 ), ) ).fetchone()

        if result is None:

            return ( CC.STATUS_NEW, None )

        else:

            ( hash_id, ) = result

            return self._GetHashIdStatus( hash_id )


    def _GetMediaResults( self, hash_ids ):

        # get first detailed results

        with HydrusDB.TemporaryIntegerTable( self._c, hash_ids, 'hash_id' ) as temp_table_name:

            hash_ids_to_info = { hash_id : ( size, mime, width, height, duration, num_frames, num_words ) for ( hash_id, size, mime, width, height, duration, num_frames, num_words ) in self._c.execute( 'SELECT * FROM files_info, ' + temp_table_name + ' USING ( hash_id );' ) }

            hash_ids_to_hashes = self._GetHashIdsToHashes( hash_ids )

            hash_ids_to_current_file_service_ids_and_timestamps = HydrusData.BuildKeyToListDict( ( ( hash_id, ( service_id, timestamp ) ) for ( hash_id, service_id, timestamp ) in self._c.execute( 'SELECT hash_id, service_id, timestamp FROM current_files, ' + temp_table_name + ' USING ( hash_id );' ) ) )

            hash_ids_to_deleted_file_service_ids = HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT hash_id, service_id FROM deleted_files, ' + temp_table_name + ' USING ( hash_id );' ) )

            hash_ids_to_pending_file_service_ids = HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT hash_id, service_id FROM file_transfers, ' + temp_table_name + ' USING ( hash_id );' ) )

            hash_ids_to_petitioned_file_service_ids = HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT hash_id, service_id FROM file_petitions, ' + temp_table_name + ' USING ( hash_id );' ) )

            hash_ids_to_urls = HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT hash_id, url FROM urls, ' + temp_table_name + ' USING ( hash_id );' ) )

            hash_ids_to_service_ids_and_filenames = HydrusData.BuildKeyToListDict( ( ( hash_id, ( service_id, filename ) ) for ( hash_id, service_id, filename ) in self._c.execute( 'SELECT hash_id, service_id, filename FROM service_filenames, ' + temp_table_name + ' USING ( hash_id );' ) ) )

            hash_ids_to_local_ratings = HydrusData.BuildKeyToListDict( ( ( hash_id, ( service_id, rating ) ) for ( service_id, hash_id, rating ) in self._c.execute( 'SELECT service_id, hash_id, rating FROM local_ratings, ' + temp_table_name + ' USING ( hash_id );' ) ) )

            tag_data = []

            tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

            for tag_service_id in tag_service_ids:

                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( tag_service_id )

                tag_data.extend( ( hash_id, ( tag_service_id, HC.CURRENT, namespace_id, tag_id ) ) for ( hash_id, namespace_id, tag_id ) in self._c.execute( 'SELECT hash_id, namespace_id, tag_id FROM ' + current_mappings_table_name + ', ' + temp_table_name + ' USING ( hash_id );' ) )
                tag_data.extend( ( hash_id, ( tag_service_id, HC.DELETED, namespace_id, tag_id ) ) for ( hash_id, namespace_id, tag_id ) in self._c.execute( 'SELECT hash_id, namespace_id, tag_id FROM ' + deleted_mappings_table_name + ', ' + temp_table_name + ' USING ( hash_id );' ) )
                tag_data.extend( ( hash_id, ( tag_service_id, HC.PENDING, namespace_id, tag_id ) ) for ( hash_id, namespace_id, tag_id ) in self._c.execute( 'SELECT hash_id, namespace_id, tag_id FROM ' + pending_mappings_table_name + ', ' + temp_table_name + ' USING ( hash_id );' ) )
                tag_data.extend( ( hash_id, ( tag_service_id, HC.PETITIONED, namespace_id, tag_id ) ) for ( hash_id, namespace_id, tag_id ) in self._c.execute( 'SELECT hash_id, namespace_id, tag_id FROM ' + petitioned_mappings_table_name + ', ' + temp_table_name + ' USING ( hash_id );' ) )


            seen_namespace_id_tag_ids = { ( namespace_id, tag_id ) for ( hash_id, ( tag_service_id, status, namespace_id, tag_id ) ) in tag_data }

            hash_ids_to_raw_tag_data = HydrusData.BuildKeyToListDict( tag_data )

            namespace_id_tag_ids_to_tags = self._GetNamespaceIdTagIdsToNamespaceTags( seen_namespace_id_tag_ids )


        # build it

        service_ids_to_service_keys = { service_id : service_key for ( service_id, service_key ) in self._c.execute( 'SELECT service_id, service_key FROM services;' ) }

        media_results = []

        tag_censorship_manager = self._controller.GetManager( 'tag_censorship' )

        for hash_id in hash_ids:

            hash = hash_ids_to_hashes[ hash_id ]

            #

            inbox = hash_id in self._inbox_hash_ids

            #

            # service_id, status, namespace_id, tag_id
            raw_tag_data = hash_ids_to_raw_tag_data[ hash_id ]

            # service_id -> ( status, tag )
            service_ids_to_tag_data = HydrusData.BuildKeyToListDict( ( ( tag_service_id, ( status, namespace_id_tag_ids_to_tags[ ( namespace_id, tag_id ) ] ) ) for ( tag_service_id, status, namespace_id, tag_id ) in raw_tag_data ) )

            service_keys_to_statuses_to_tags = collections.defaultdict( HydrusData.default_dict_set )

            service_keys_to_statuses_to_tags.update( { service_ids_to_service_keys[ service_id ] : HydrusData.BuildKeyToSetDict( tag_data ) for ( service_id, tag_data ) in service_ids_to_tag_data.items() } )

            service_keys_to_statuses_to_tags = tag_censorship_manager.FilterServiceKeysToStatusesToTags( service_keys_to_statuses_to_tags )

            tags_manager = ClientMedia.TagsManager( service_keys_to_statuses_to_tags )

            #

            current_file_service_keys = { service_ids_to_service_keys[ service_id ] for ( service_id, timestamp ) in hash_ids_to_current_file_service_ids_and_timestamps[ hash_id ] }

            deleted_file_service_keys = { service_ids_to_service_keys[ service_id ] for service_id in hash_ids_to_deleted_file_service_ids[ hash_id ] }

            pending_file_service_keys = { service_ids_to_service_keys[ service_id ] for service_id in hash_ids_to_pending_file_service_ids[ hash_id ] }

            petitioned_file_service_keys = { service_ids_to_service_keys[ service_id ] for service_id in hash_ids_to_petitioned_file_service_ids[ hash_id ] }

            urls = hash_ids_to_urls[ hash_id ]

            service_ids_to_filenames = HydrusData.BuildKeyToListDict( hash_ids_to_service_ids_and_filenames[ hash_id ] )

            service_keys_to_filenames = { service_ids_to_service_keys[ service_id ] : filenames for ( service_id, filenames ) in service_ids_to_filenames.items() }

            current_file_service_keys_to_timestamps = { service_ids_to_service_keys[ service_id ] : timestamp for ( service_id, timestamp ) in hash_ids_to_current_file_service_ids_and_timestamps[ hash_id ] }

            locations_manager = ClientMedia.LocationsManager( current_file_service_keys, deleted_file_service_keys, pending_file_service_keys, petitioned_file_service_keys, urls = urls, service_keys_to_filenames = service_keys_to_filenames, current_to_timestamps = current_file_service_keys_to_timestamps )

            #

            local_ratings = { service_ids_to_service_keys[ service_id ] : rating for ( service_id, rating ) in hash_ids_to_local_ratings[ hash_id ] }

            ratings_manager = ClientRatings.RatingsManager( local_ratings )

            #

            if hash_id in hash_ids_to_info:

                ( size, mime, width, height, duration, num_frames, num_words ) = hash_ids_to_info[ hash_id ]

            else:

                ( size, mime, width, height, duration, num_frames, num_words ) = ( None, HC.APPLICATION_UNKNOWN, None, None, None, None, None )


            media_results.append( ClientMedia.MediaResult( ( hash, inbox, size, mime, width, height, duration, num_frames, num_words, tags_manager, locations_manager, ratings_manager ) ) )


        return media_results


    def _GetMediaResultsFromHashes( self, hashes ):

        query_hash_ids = set( self._GetHashIds( hashes ) )

        return self._GetMediaResults( query_hash_ids )


    def _GetMime( self, hash_id ):

        result = self._c.execute( 'SELECT mime FROM files_info WHERE hash_id = ?;', ( hash_id, ) ).fetchone()

        if result is None:

            raise HydrusExceptions.FileMissingException( 'Did not have mime information for that file!' )


        ( mime, ) = result

        return mime


    def _GetNamespaceId( self, namespace ):

        result = self._c.execute( 'SELECT namespace_id FROM namespaces WHERE namespace = ?;', ( namespace, ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO namespaces ( namespace ) VALUES ( ? );', ( namespace, ) )

            namespace_id = self._c.lastrowid

        else:

            ( namespace_id, ) = result


        return namespace_id


    def _GetNamespaceIdTagId( self, tag ):

        tag = HydrusTags.CleanTag( tag )

        HydrusTags.CheckTagNotEmpty( tag )

        if ':' in tag:

            ( namespace, tag ) = tag.split( ':', 1 )

            namespace_id = self._GetNamespaceId( namespace )

        else:

            namespace_id = 1


        result = self._c.execute( 'SELECT tag_id FROM tags WHERE tag = ?;', ( tag, ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO tags ( tag ) VALUES ( ? );', ( tag, ) )

            tag_id = self._c.lastrowid

            self._c.execute( 'REPLACE INTO tags_fts4 ( docid, tag ) VALUES ( ?, ? );', ( tag_id, tag ) )

        else:

            ( tag_id, ) = result


        result = self._c.execute( 'SELECT 1 FROM existing_tags WHERE namespace_id = ? AND tag_id = ?;', ( namespace_id, tag_id ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO existing_tags ( namespace_id, tag_id ) VALUES ( ?, ? );', ( namespace_id, tag_id ) )


        return ( namespace_id, tag_id )


    def _GetNamespaceIdTagIdsToNamespaceTags( self, pairs ):

        namespace_ids = { namespace_id for ( namespace_id, tag_id ) in pairs }
        tag_ids = { tag_id for ( namespace_id, tag_id ) in pairs }

        with HydrusDB.TemporaryIntegerTable( self._c, namespace_ids, 'namespace_id' ) as temp_table_name:

            namespace_ids_to_namespaces = { namespace_id : namespace for ( namespace_id, namespace ) in self._c.execute( 'SELECT namespace_id, namespace FROM namespaces, ' + temp_table_name + ' USING ( namespace_id );' ) }


        with HydrusDB.TemporaryIntegerTable( self._c, tag_ids, 'tag_id' ) as temp_table_name:

            tag_ids_to_tags = { tag_id : tag for ( tag_id, tag ) in self._c.execute( 'SELECT tag_id, tag FROM tags, ' + temp_table_name + ' USING ( tag_id );' ) }


        return { ( namespace_id, tag_id ) : HydrusTags.CombineTag( namespace_ids_to_namespaces[ namespace_id ], tag_ids_to_tags[ tag_id ] ) for ( namespace_id, tag_id ) in pairs }


    def _GetNamespaceTag( self, namespace_id, tag_id ):

        result = self._c.execute( 'SELECT tag FROM tags WHERE tag_id = ?;', ( tag_id, ) ).fetchone()

        if result is None:

            raise HydrusExceptions.DataMissing( 'Tag error in database' )


        ( tag, ) = result

        if namespace_id == 1:

            return HydrusTags.CombineTag( '', tag )

        else:

            result = self._c.execute( 'SELECT namespace FROM namespaces WHERE namespace_id = ?;', ( namespace_id, ) ).fetchone()

            if result is None:

                raise HydrusExceptions.DataMissing( 'Namespace error in database' )


            ( namespace, ) = result

            return HydrusTags.CombineTag( namespace, tag )


    def _GetNews( self, service_key ):

        service_id = self._GetServiceId( service_key )

        news = self._c.execute( 'SELECT post, timestamp FROM news WHERE service_id = ?;', ( service_id, ) ).fetchall()

        return news


    def _GetNumsPending( self ):

        services = self._GetServices( ( HC.TAG_REPOSITORY, HC.FILE_REPOSITORY, HC.IPFS ) )

        pendings = {}

        for service in services:

            service_key = service.GetServiceKey()
            service_type = service.GetServiceType()

            service_id = self._GetServiceId( service_key )

            if service_type in ( HC.FILE_REPOSITORY, HC.IPFS ): info_types = { HC.SERVICE_INFO_NUM_PENDING_FILES, HC.SERVICE_INFO_NUM_PETITIONED_FILES }
            elif service_type == HC.TAG_REPOSITORY: info_types = { HC.SERVICE_INFO_NUM_PENDING_MAPPINGS, HC.SERVICE_INFO_NUM_PETITIONED_MAPPINGS, HC.SERVICE_INFO_NUM_PENDING_TAG_SIBLINGS, HC.SERVICE_INFO_NUM_PETITIONED_TAG_SIBLINGS, HC.SERVICE_INFO_NUM_PENDING_TAG_PARENTS, HC.SERVICE_INFO_NUM_PETITIONED_TAG_PARENTS }

            pendings[ service_key ] = self._GetServiceInfoSpecific( service_id, service_type, info_types )


        return pendings


    def _GetOptions( self ):

        result = self._c.execute( 'SELECT options FROM options;' ).fetchone()

        if result is None:

            options = ClientDefaults.GetClientDefaultOptions()

            self._c.execute( 'INSERT INTO options ( options ) VALUES ( ? );', ( options, ) )

        else:

            ( options, ) = result

            default_options = ClientDefaults.GetClientDefaultOptions()

            for key in default_options:

                if key not in options: options[ key ] = default_options[ key ]


        return options


    def _GetPending( self, service_key ):

        service_id = self._GetServiceId( service_key )

        service = self._GetService( service_id )

        service_type = service.GetServiceType()

        content_data_dict = HydrusData.GetEmptyDataDict()
        all_hash_ids = set()

        if service_type == HC.TAG_REPOSITORY:

            # mappings

            ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

            pending_dict = HydrusData.BuildKeyToListDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM ' + pending_mappings_table_name + ' ORDER BY tag_id LIMIT 100;' ) ] )

            for ( ( namespace_id, tag_id ), hash_ids ) in pending_dict.items():

                pending = ( self._GetNamespaceTag( namespace_id, tag_id ), hash_ids )

                content_data_dict[ HC.CONTENT_TYPE_MAPPINGS ][ HC.CONTENT_UPDATE_PEND ].append( pending )

                all_hash_ids.update( hash_ids )


            petitioned_dict = HydrusData.BuildKeyToListDict( [ ( ( namespace_id, tag_id, reason_id ), hash_id ) for ( namespace_id, tag_id, hash_id, reason_id ) in self._c.execute( 'SELECT namespace_id, tag_id, hash_id, reason_id FROM ' + petitioned_mappings_table_name + ' ORDER BY reason_id LIMIT 100;' ) ] )

            for ( ( namespace_id, tag_id, reason_id ), hash_ids ) in petitioned_dict.items():

                petitioned = ( self._GetNamespaceTag( namespace_id, tag_id ), hash_ids, self._GetText( reason_id ) )

                content_data_dict[ HC.CONTENT_TYPE_MAPPINGS ][ HC.CONTENT_UPDATE_PETITION ].append( petitioned )

                all_hash_ids.update( hash_ids )


            # tag siblings

            pending = [ ( ( self._GetNamespaceTag( old_namespace_id, old_tag_id ), self._GetNamespaceTag( new_namespace_id, new_tag_id ) ), self._GetText( reason_id ) ) for ( old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, reason_id ) in self._c.execute( 'SELECT old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, reason_id FROM tag_sibling_petitions WHERE service_id = ? AND status = ? ORDER BY reason_id LIMIT 100;', ( service_id, HC.PENDING ) ).fetchall() ]

            if len( pending ) > 0:

                content_data_dict[ HC.CONTENT_TYPE_TAG_SIBLINGS ][ HC.CONTENT_UPDATE_PEND ] = pending


            petitioned = [ ( ( self._GetNamespaceTag( old_namespace_id, old_tag_id ), self._GetNamespaceTag( new_namespace_id, new_tag_id ) ), self._GetText( reason_id ) ) for ( old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, reason_id ) in self._c.execute( 'SELECT old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, reason_id FROM tag_sibling_petitions WHERE service_id = ? AND status = ? ORDER BY reason_id LIMIT 100;', ( service_id, HC.PETITIONED ) ).fetchall() ]

            if len( petitioned ) > 0:

                content_data_dict[ HC.CONTENT_TYPE_TAG_SIBLINGS ][ HC.CONTENT_UPDATE_PETITION ] = petitioned


            # tag parents

            pending = [ ( ( self._GetNamespaceTag( child_namespace_id, child_tag_id ), self._GetNamespaceTag( parent_namespace_id, parent_tag_id ) ), self._GetText( reason_id ) ) for ( child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, reason_id ) in self._c.execute( 'SELECT child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, reason_id FROM tag_parent_petitions WHERE service_id = ? AND status = ? ORDER BY reason_id LIMIT 100;', ( service_id, HC.PENDING ) ).fetchall() ]

            if len( pending ) > 0:

                content_data_dict[ HC.CONTENT_TYPE_TAG_PARENTS ][ HC.CONTENT_UPDATE_PEND ] = pending


            petitioned = [ ( ( self._GetNamespaceTag( child_namespace_id, child_tag_id ), self._GetNamespaceTag( parent_namespace_id, parent_tag_id ) ), self._GetText( reason_id ) ) for ( child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, reason_id ) in self._c.execute( 'SELECT child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, reason_id FROM tag_parent_petitions WHERE service_id = ? AND status = ? ORDER BY reason_id LIMIT 100;', ( service_id, HC.PETITIONED ) ).fetchall() ]

            if len( petitioned ) > 0:

                content_data_dict[ HC.CONTENT_TYPE_TAG_PARENTS ][ HC.CONTENT_UPDATE_PETITION ] = petitioned


        elif service_type == HC.FILE_REPOSITORY:

            result = self._c.execute( 'SELECT hash_id FROM file_transfers WHERE service_id = ?;', ( service_id, ) ).fetchone()

            if result is not None:

                ( hash_id, ) = result

                media_result = self._GetMediaResults( ( hash_id, ) )[ 0 ]

                return media_result


            petitioned = [ ( hash_ids, reason_id ) for ( reason_id, hash_ids ) in HydrusData.BuildKeyToListDict( self._c.execute( 'SELECT reason_id, hash_id FROM file_petitions WHERE service_id = ? ORDER BY reason_id LIMIT 100;', ( service_id, ) ) ).items() ]

            petitioned = [ ( hash_ids, self._GetText( reason_id ) ) for ( hash_ids, reason_id ) in petitioned ]

            if len( petitioned ) > 0:

                all_hash_ids = { hash_id for hash_id in itertools.chain.from_iterable( ( hash_ids for ( hash_ids, reason ) in petitioned ) ) }

                content_data_dict[ HC.CONTENT_TYPE_FILES ][ HC.CONTENT_UPDATE_PETITION ] = petitioned


        elif service_type == HC.IPFS:

            result = self._c.execute( 'SELECT hash_id FROM file_transfers WHERE service_id = ?;', ( service_id, ) ).fetchone()

            if result is not None:

                ( hash_id, ) = result

                media_result = self._GetMediaResults( ( hash_id, ) )[ 0 ]

                return media_result


            result = self._c.execute( 'SELECT hash_id FROM file_petitions WHERE service_id = ?;', ( service_id, ) ).fetchone()

            if result is not None:

                ( hash_id, ) = result

                hash = self._GetHash( hash_id )

                multihash = self._GetServiceFilename( service_id, hash_id )

                return ( hash, multihash )


        if len( content_data_dict ) > 0:

            hash_ids_to_hashes = self._GetHashIdsToHashes( all_hash_ids )

            content_update_package = HydrusData.ClientToServerContentUpdatePackage( content_data_dict, hash_ids_to_hashes )

            return content_update_package

        else:

            return None


    def _GetRecentTags( self, service_key ):

        service_id = self._GetServiceId( service_key )

        # we could be clever and do LIMIT and ORDER BY in the delete, but not all compilations of SQLite have that turned on, so let's KISS

        tag_ids_to_timestamp = { ( namespace_id, tag_id ) : timestamp for ( namespace_id, tag_id, timestamp ) in self._c.execute( 'SELECT namespace_id, tag_id, timestamp FROM recent_tags WHERE service_id = ?;', ( service_id, ) ) }

        def sort_key( key ):

            return tag_ids_to_timestamp[ key ]


        newest_first = tag_ids_to_timestamp.keys()

        newest_first.sort( key = sort_key, reverse = True )

        num_we_want = HydrusGlobals.client_controller.GetNewOptions().GetNoneableInteger( 'num_recent_tags' )

        if num_we_want == None:

            num_we_want = 20


        decayed = newest_first[ num_we_want : ]

        if len( decayed ) > 0:

            self._c.executemany( 'DELETE FROM recent_tags WHERE service_id = ? AND namespace_id = ? AND tag_id = ?;', ( ( service_id, namespace_id, tag_id ) for ( namespace_id, tag_id ) in decayed ) )


        sorted_recent_tags = [ self._GetNamespaceTag( namespace_id, tag_id ) for ( namespace_id, tag_id ) in newest_first[ : num_we_want ] ]

        return sorted_recent_tags


    def _GetRelatedTags( self, service_key, skip_hash, search_tags, max_results, max_time_to_take ):

        siblings_manager = HydrusGlobals.client_controller.GetManager( 'tag_siblings' )

        search_tags = siblings_manager.CollapseTags( service_key, search_tags )

        start = HydrusData.GetNowPrecise()

        service_id = self._GetServiceId( service_key )

        skip_hash_id = self._GetHashId( skip_hash )

        ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

        search_namespace_ids_to_tag_ids = HydrusData.BuildKeyToListDict( [ self._GetNamespaceIdTagId( tag ) for tag in search_tags ] )

        namespace_ids = search_namespace_ids_to_tag_ids.keys()

        if len( namespace_ids ) == 0:

            return []


        random.shuffle( namespace_ids )

        time_on_this_section = max_time_to_take / 2

        # this biases namespaced tags when we are in a rush, as they are less common than unnamespaced but will get the same search time
        time_per_namespace = time_on_this_section / len( namespace_ids )

        hash_ids_counter = collections.Counter()

        for namespace_id in namespace_ids:

            namespace_start = HydrusData.GetNowPrecise()

            tag_ids = search_namespace_ids_to_tag_ids[ namespace_id ]

            random.shuffle( tag_ids )

            query = self._c.execute( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE namespace_id = ? AND tag_id IN ' + HydrusData.SplayListForDB( tag_ids ) + ';', ( namespace_id, ) )

            results = query.fetchmany( 100 )

            while len( results ) > 0:

                for ( hash_id, ) in results:

                    hash_ids_counter[ hash_id ] += 1


                if HydrusData.TimeHasPassedPrecise( namespace_start + time_per_namespace ):

                    break


                results = query.fetchmany( 100 )


            if HydrusData.TimeHasPassedPrecise( namespace_start + time_per_namespace ):

                break


        if skip_hash_id in hash_ids_counter:

            del hash_ids_counter[ skip_hash_id ]


        #

        if len( hash_ids_counter ) == 0:

            return []


        # this stuff is often 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1.....
        # the 1 stuff often produces large quantities of the same very popular tag, so your search for [ 'eva', 'female' ] will produce 'touhou' because so many 2hu images have 'female'
        # so we want to do a 'soft' intersect, only picking the files that have the greatest number of shared search_tags
        # this filters to only the '2' results, which gives us eva females and their hair colour and a few choice other popular tags for that particular domain

        [ ( gumpf, largest_count ) ] = hash_ids_counter.most_common( 1 )

        hash_ids = [ hash_id for ( hash_id, count ) in hash_ids_counter.items() if count > largest_count * 0.8 ]

        counter = collections.Counter()

        random.shuffle( hash_ids )

        for hash_id in hash_ids:

            for ( namespace_id, tag_id ) in self._c.execute( 'SELECT namespace_id, tag_id FROM ' + current_mappings_table_name + ' WHERE hash_id = ?;', ( hash_id, ) ):

                counter[ ( namespace_id, tag_id ) ] += 1


            if HydrusData.TimeHasPassedPrecise( start + max_time_to_take ):

                break


        #

        for ( namespace_id, tag_ids ) in search_namespace_ids_to_tag_ids.items():

            for tag_id in tag_ids:

                if ( namespace_id, tag_id ) in counter:

                    del counter[ ( namespace_id, tag_id ) ]


        results = counter.most_common( max_results )

        tags_to_counts = { self._GetNamespaceTag( namespace_id, tag_id ) : count for ( ( namespace_id, tag_id ), count ) in results }

        tags_to_counts = siblings_manager.CollapseTagsToCount( service_key, tags_to_counts )

        tags_to_do = tags_to_counts.keys()

        tags_to_do = { tag for tag in tags_to_counts if tag not in search_tags }

        tag_censorship_manager = self._controller.GetManager( 'tag_censorship' )

        filtered_tags = tag_censorship_manager.FilterTags( service_key, tags_to_do )

        inclusive = True
        pending_count = 0

        predicates = [ ClientSearch.Predicate( HC.PREDICATE_TYPE_TAG, tag, inclusive, tags_to_counts[ tag ], pending_count ) for tag in filtered_tags ]

        return predicates


    def _GetRemoteThumbnailHashesIShouldHave( self, service_key ):

        service_id = self._GetServiceId( service_key )

        hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files, files_info USING ( hash_id ) WHERE mime IN ' + HydrusData.SplayListForDB( HC.MIMES_WITH_THUMBNAILS ) + ' AND service_id = ?;', ( service_id, ) ) }

        hash_ids.difference_update( ( hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?;', ( self._combined_local_file_service_id, ) ) ) )

        hashes = set( self._GetHashes( hash_ids ) )

        return hashes


    def _GetService( self, service_id ):

        if service_id in self._service_cache:

            service = self._service_cache[ service_id ]

        else:

            ( service_key, service_type, name, info ) = self._c.execute( 'SELECT service_key, service_type, name, info FROM services WHERE service_id = ?;', ( service_id, ) ).fetchone()

            service = ClientData.GenerateService( service_key, service_type, name, info )

            self._service_cache[ service_id ] = service


        if service.GetServiceType() == HC.LOCAL_BOORU:

            info = service.GetInfo()

            current_time_struct = time.gmtime()

            ( current_year, current_month ) = ( current_time_struct.tm_year, current_time_struct.tm_mon )

            ( booru_year, booru_month ) = info[ 'current_data_month' ]

            if current_year != booru_year or current_month != booru_month:

                info[ 'used_monthly_data' ] = 0
                info[ 'used_monthly_requests' ] = 0

                info[ 'current_data_month' ] = ( current_year, current_month )

                self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


        return service


    def _GetServiceDirectoryHashes( self, service_key, dirname ):

        service_id = self._GetServiceId( service_key )
        directory_id = self._GetTextId( dirname )

        hash_ids = [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM service_directory_file_map WHERE service_id = ? AND directory_id = ?;', ( service_id, directory_id ) ) ]

        hashes = self._GetHashes( hash_ids )

        return hashes


    def _GetServiceDirectoriesInfo( self, service_key ):

        service_id = self._GetServiceId( service_key )

        incomplete_info = self._c.execute( 'SELECT directory_id, num_files, total_size, note FROM service_directories WHERE service_id = ?;', ( service_id, ) ).fetchall()

        info = [ ( self._GetText( directory_id ), num_files, total_size, note ) for ( directory_id, num_files, total_size, note ) in incomplete_info ]

        return info


    def _GetServiceFilename( self, service_id, hash_id ):

        result = self._c.execute( 'SELECT filename FROM service_filenames WHERE service_id = ? AND hash_id = ?;', ( service_id, hash_id ) ).fetchone()

        if result is None:

            raise HydrusExceptions.DataMissing( 'Service filename not found!' )


        ( filename, ) = result

        return filename


    def _GetServiceFilenames( self, service_key, hashes ):

        service_id = self._GetServiceId( service_key )
        hash_ids = self._GetHashIds( hashes )

        result = [ filename for ( filename, ) in self._c.execute( 'SELECT filename FROM service_filenames WHERE service_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( service_id, ) ) ]

        result.sort()

        return result


    def _GetServices( self, limited_types = HC.ALL_SERVICES ):

        service_ids = [ service_id for ( service_id, ) in self._c.execute( 'SELECT service_id FROM services WHERE service_type IN ' + HydrusData.SplayListForDB( limited_types ) + ';' ) ]

        services = [ self._GetService( service_id ) for service_id in service_ids ]

        return services


    def _GetServiceId( self, service_key ):

        result = self._c.execute( 'SELECT service_id FROM services WHERE service_key = ?;', ( sqlite3.Binary( service_key ), ) ).fetchone()

        if result is None:

            raise HydrusExceptions.DataMissing( 'Service id error in database' )


        ( service_id, ) = result

        return service_id


    def _GetServiceIds( self, service_types ): return [ service_id for ( service_id, ) in self._c.execute( 'SELECT service_id FROM services WHERE service_type IN ' + HydrusData.SplayListForDB( service_types ) + ';' ) ]

    def _GetServiceInfo( self, service_key ):

        service_id = self._GetServiceId( service_key )

        service = self._GetService( service_id )

        service_type = service.GetServiceType()

        if service_type == HC.COMBINED_LOCAL_FILE:

            info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_TOTAL_SIZE, HC.SERVICE_INFO_NUM_DELETED_FILES }

        elif service_type in ( HC.LOCAL_FILE_DOMAIN, HC.LOCAL_FILE_TRASH_DOMAIN ):

            info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_TOTAL_SIZE }

        elif service_type == HC.FILE_REPOSITORY:

            info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_TOTAL_SIZE, HC.SERVICE_INFO_NUM_DELETED_FILES }

        elif service_type == HC.IPFS:

            info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_TOTAL_SIZE }

        elif service_type == HC.LOCAL_TAG:

            info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_NUM_TAGS, HC.SERVICE_INFO_NUM_MAPPINGS }

        elif service_type == HC.TAG_REPOSITORY:

            info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_NUM_TAGS, HC.SERVICE_INFO_NUM_MAPPINGS, HC.SERVICE_INFO_NUM_DELETED_MAPPINGS }

        elif service_type in ( HC.LOCAL_RATING_LIKE, HC.LOCAL_RATING_NUMERICAL ):

            info_types = { HC.SERVICE_INFO_NUM_FILES }

        elif service_type == HC.LOCAL_BOORU:

            info_types = { HC.SERVICE_INFO_NUM_SHARES }

        else:

            info_types = set()


        service_info = self._GetServiceInfoSpecific( service_id, service_type, info_types )

        return service_info


    def _GetServiceInfoSpecific( self, service_id, service_type, info_types ):

        results = { info_type : info for ( info_type, info ) in self._c.execute( 'SELECT info_type, info FROM service_info WHERE service_id = ? AND info_type IN ' + HydrusData.SplayListForDB( info_types ) + ';', ( service_id, ) ) }

        if len( results ) != len( info_types ):

            info_types_hit = results.keys()

            info_types_missed = info_types.difference( info_types_hit )

            if service_type in HC.TAG_SERVICES:

                common_tag_info_types = { HC.SERVICE_INFO_NUM_FILES, HC.SERVICE_INFO_NUM_TAGS }

                if common_tag_info_types <= info_types_missed:

                    ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

                    ( num_files, num_tags ) = self._c.execute( 'SELECT COUNT( DISTINCT hash_id ), COUNT( DISTINCT tag_id ) FROM ' + current_mappings_table_name + ';' ).fetchone()

                    results[ HC.SERVICE_INFO_NUM_FILES ] = num_files
                    results[ HC.SERVICE_INFO_NUM_TAGS ] = num_tags

                    self._c.execute( 'INSERT INTO service_info ( service_id, info_type, info ) VALUES ( ?, ?, ? );', ( service_id, HC.SERVICE_INFO_NUM_FILES, num_files ) )
                    self._c.execute( 'INSERT INTO service_info ( service_id, info_type, info ) VALUES ( ?, ?, ? );', ( service_id, HC.SERVICE_INFO_NUM_TAGS, num_tags ) )

                    info_types_missed.difference_update( common_tag_info_types )


            for info_type in info_types_missed:

                save_it = True

                if service_type in HC.FILE_SERVICES:

                    if info_type in ( HC.SERVICE_INFO_NUM_PENDING_FILES, HC.SERVICE_INFO_NUM_PETITIONED_FILES ): save_it = False

                    if info_type == HC.SERVICE_INFO_NUM_FILES: result = self._c.execute( 'SELECT COUNT( * ) FROM current_files WHERE service_id = ?;', ( service_id, ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_TOTAL_SIZE: result = self._c.execute( 'SELECT SUM( size ) FROM current_files, files_info USING ( hash_id ) WHERE service_id = ?;', ( service_id, ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_DELETED_FILES: result = self._c.execute( 'SELECT COUNT( * ) FROM deleted_files WHERE service_id = ?;', ( service_id, ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PENDING_FILES: result = self._c.execute( 'SELECT COUNT( * ) FROM file_transfers WHERE service_id = ?;', ( service_id, ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PETITIONED_FILES: result = self._c.execute( 'SELECT COUNT( * ) FROM file_petitions where service_id = ?;', ( service_id, ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_INBOX: result = self._c.execute( 'SELECT COUNT( * ) FROM file_inbox, current_files USING ( hash_id ) WHERE service_id = ?;', ( service_id, ) ).fetchone()

                elif service_type in HC.TAG_SERVICES:

                    ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

                    if info_type in ( HC.SERVICE_INFO_NUM_PENDING_TAG_SIBLINGS, HC.SERVICE_INFO_NUM_PETITIONED_TAG_SIBLINGS, HC.SERVICE_INFO_NUM_PENDING_TAG_PARENTS, HC.SERVICE_INFO_NUM_PETITIONED_TAG_PARENTS ): save_it = False

                    if info_type == HC.SERVICE_INFO_NUM_FILES: result = self._c.execute( 'SELECT COUNT( DISTINCT hash_id ) FROM ' + current_mappings_table_name + ';' ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_TAGS: result = self._c.execute( 'SELECT COUNT( DISTINCT tag_id ) FROM ' + current_mappings_table_name + ';' ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_MAPPINGS: result = self._c.execute( 'SELECT COUNT( * ) FROM ' + current_mappings_table_name + ';' ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_DELETED_MAPPINGS: result = self._c.execute( 'SELECT COUNT( * ) FROM ' + deleted_mappings_table_name + ';' ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PENDING_MAPPINGS: result = self._c.execute( 'SELECT COUNT( * ) FROM ' + pending_mappings_table_name + ';' ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PETITIONED_MAPPINGS: result = self._c.execute( 'SELECT COUNT( * ) FROM ' + petitioned_mappings_table_name + ';' ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PENDING_TAG_SIBLINGS: result = self._c.execute( 'SELECT COUNT( * ) FROM tag_sibling_petitions WHERE service_id = ? AND status = ?;', ( service_id, HC.PENDING ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PETITIONED_TAG_SIBLINGS: result = self._c.execute( 'SELECT COUNT( * ) FROM tag_sibling_petitions WHERE service_id = ? AND status = ?;', ( service_id, HC.PETITIONED ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PENDING_TAG_PARENTS: result = self._c.execute( 'SELECT COUNT( * ) FROM tag_parent_petitions WHERE service_id = ? AND status = ?;', ( service_id, HC.PENDING ) ).fetchone()
                    elif info_type == HC.SERVICE_INFO_NUM_PETITIONED_TAG_PARENTS: result = self._c.execute( 'SELECT COUNT( * ) FROM tag_parent_petitions WHERE service_id = ? AND status = ?;', ( service_id, HC.PETITIONED ) ).fetchone()

                elif service_type in ( HC.LOCAL_RATING_LIKE, HC.LOCAL_RATING_NUMERICAL ):

                    if info_type == HC.SERVICE_INFO_NUM_FILES: result = self._c.execute( 'SELECT COUNT( * ) FROM local_ratings WHERE service_id = ?;', ( service_id, ) ).fetchone()

                elif service_type == HC.LOCAL_BOORU:

                    if info_type == HC.SERVICE_INFO_NUM_SHARES: result = self._c.execute( 'SELECT COUNT( * ) FROM yaml_dumps WHERE dump_type = ?;', ( YAML_DUMP_ID_LOCAL_BOORU, ) ).fetchone()


                if result is None: info = 0
                else: ( info, ) = result

                if info is None: info = 0

                if save_it:

                    self._c.execute( 'INSERT INTO service_info ( service_id, info_type, info ) VALUES ( ?, ?, ? );', ( service_id, info_type, info ) )


                results[ info_type ] = info


        return results


    def _GetSiteId( self, name ):

        result = self._c.execute( 'SELECT site_id FROM imageboard_sites WHERE name = ?;', ( name, ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO imageboard_sites ( name ) VALUES ( ? );', ( name, ) )

            site_id = self._c.lastrowid

        else: ( site_id, ) = result

        return site_id


    def _GetTagCensorship( self, service_key = None ):

        if service_key is None:

            result = []

            for ( service_id, blacklist, tags ) in self._c.execute( 'SELECT service_id, blacklist, tags FROM tag_censorship;' ).fetchall():

                service = self._GetService( service_id )

                service_key = service.GetServiceKey()

                result.append( ( service_key, blacklist, tags ) )


        else:

            service_id = self._GetServiceId( service_key )

            result = self._c.execute( 'SELECT blacklist, tags FROM tag_censorship WHERE service_id = ?;', ( service_id, ) ).fetchone()

            if result is None: result = ( True, [] )


        return result


    def _GetTagParents( self, service_key = None ):

        tag_censorship_manager = self._controller.GetManager( 'tag_censorship' )

        if service_key is None:

            service_ids_to_statuses_and_pair_ids = HydrusData.BuildKeyToListDict( ( ( service_id, ( status, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id ) ) for ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status ) in self._c.execute( 'SELECT service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status FROM tag_parents UNION SELECT service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status FROM tag_parent_petitions;' ) ) )

            service_keys_to_statuses_to_pairs = collections.defaultdict( HydrusData.default_dict_set )

            for ( service_id, statuses_and_pair_ids ) in service_ids_to_statuses_and_pair_ids.items():

                service = self._GetService( service_id )

                service_key = service.GetServiceKey()

                statuses_to_pairs = HydrusData.BuildKeyToSetDict( ( ( status, ( self._GetNamespaceTag( child_namespace_id, child_tag_id ), self._GetNamespaceTag( parent_namespace_id, parent_tag_id ) ) ) for ( status, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id ) in statuses_and_pair_ids ) )

                statuses_to_pairs = tag_censorship_manager.FilterStatusesToPairs( service_key, statuses_to_pairs )

                service_keys_to_statuses_to_pairs[ service_key ] = statuses_to_pairs


            return service_keys_to_statuses_to_pairs

        else:

            service_id = self._GetServiceId( service_key )

            statuses_and_pair_ids = self._c.execute( 'SELECT child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status FROM tag_parents WHERE service_id = ? UNION SELECT child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status FROM tag_parent_petitions WHERE service_id = ?;', ( service_id, service_id ) ).fetchall()

            statuses_to_pairs = HydrusData.BuildKeyToSetDict( ( ( status, ( self._GetNamespaceTag( child_namespace_id, child_tag_id ), self._GetNamespaceTag( parent_namespace_id, parent_tag_id ) ) ) for ( child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status ) in statuses_and_pair_ids ) )

            statuses_to_pairs = tag_censorship_manager.FilterStatusesToPairs( service_key, statuses_to_pairs )

            return statuses_to_pairs


    def _GetTagSiblings( self, service_key = None ):

        tag_censorship_manager = self._controller.GetManager( 'tag_censorship' )

        if service_key is None:

            service_ids_to_statuses_and_pair_ids = HydrusData.BuildKeyToListDict( ( ( service_id, ( status, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id ) ) for ( service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status ) in self._c.execute( 'SELECT service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status FROM tag_siblings UNION SELECT service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status FROM tag_sibling_petitions;' ) ) )

            service_keys_to_statuses_to_pairs = collections.defaultdict( HydrusData.default_dict_set )

            for ( service_id, statuses_and_pair_ids ) in service_ids_to_statuses_and_pair_ids.items():

                service = self._GetService( service_id )

                service_key = service.GetServiceKey()

                statuses_to_pairs = HydrusData.BuildKeyToSetDict( ( ( status, ( self._GetNamespaceTag( old_namespace_id, old_tag_id ), self._GetNamespaceTag( new_namespace_id, new_tag_id ) ) ) for ( status, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id ) in statuses_and_pair_ids ) )

                statuses_to_pairs = tag_censorship_manager.FilterStatusesToPairs( service_key, statuses_to_pairs )

                service_keys_to_statuses_to_pairs[ service_key ] = statuses_to_pairs


            return service_keys_to_statuses_to_pairs

        else:

            service_id = self._GetServiceId( service_key )

            statuses_and_pair_ids = self._c.execute( 'SELECT old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status FROM tag_siblings WHERE service_id = ? UNION SELECT old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status FROM tag_sibling_petitions WHERE service_id = ?;', ( service_id, service_id ) ).fetchall()

            statuses_to_pairs = HydrusData.BuildKeyToSetDict( ( ( status, ( self._GetNamespaceTag( old_namespace_id, old_tag_id ), self._GetNamespaceTag( new_namespace_id, new_tag_id ) ) ) for ( old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status ) in statuses_and_pair_ids ) )

            statuses_to_pairs = tag_censorship_manager.FilterStatusesToPairs( service_key, statuses_to_pairs )

            return statuses_to_pairs


    def _GetText( self, text_id ):

        result = self._c.execute( 'SELECT text FROM texts WHERE text_id = ?;', ( text_id, ) ).fetchone()

        if result is None:

            raise HydrusExceptions.DataMissing( 'Text lookup error in database' )


        ( text, ) = result

        return text


    def _GetTextId( self, text ):

        result = self._c.execute( 'SELECT text_id FROM texts WHERE text = ?;', ( text, ) ).fetchone()

        if result is None:

            self._c.execute( 'INSERT INTO texts ( text ) VALUES ( ? );', ( text, ) )

            text_id = self._c.lastrowid

        else:

            ( text_id, ) = result


        return text_id


    def _GetTrashHashes( self, limit = None, minimum_age = None ):

        if limit is None:

            limit_phrase = ''

        else:

            limit_phrase = ' LIMIT ' + str( limit )


        if minimum_age is None:

            age_phrase = ''

        else:

            timestamp_cutoff = HydrusData.GetNow() - minimum_age

            age_phrase = ' AND timestamp < ' + str( timestamp_cutoff ) + ' ORDER BY timestamp ASC'


        hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?' + age_phrase + limit_phrase + ';', ( self._trash_service_id, ) ) }

        if HydrusGlobals.db_report_mode:

            message = 'When asked for '

            if limit is None:

                message += 'all the'

            else:

                message += 'at most ' + HydrusData.ConvertIntToPrettyString( limit )


            message += ' trash files,'

            if minimum_age is not None:

                message += ' with minimum age ' + HydrusData.ConvertTimestampToPrettyAge( timestamp_cutoff ) + ','


            message += ' I found ' + HydrusData.ConvertIntToPrettyString( len( hash_ids ) ) + '.'

            HydrusData.ShowText( message )


        return self._GetHashes( hash_ids )


    def _GetURLStatus( self, url ):

        result = self._c.execute( 'SELECT hash_id FROM urls WHERE url = ?;', ( url, ) ).fetchone()

        if result is None:

            return ( CC.STATUS_NEW, None )

        else:

            ( hash_id, ) = result

            return self._GetHashIdStatus( hash_id )


    def _GetWebSessions( self ):

        now = HydrusData.GetNow()

        self._c.execute( 'DELETE FROM web_sessions WHERE ? > expiry;', ( now, ) )

        sessions = []

        sessions = self._c.execute( 'SELECT name, cookies, expiry FROM web_sessions;' ).fetchall()

        return sessions


    def _GetYAMLDump( self, dump_type, dump_name = None ):

        if dump_name is None:

            result = { dump_name : data for ( dump_name, data ) in self._c.execute( 'SELECT dump_name, dump FROM yaml_dumps WHERE dump_type = ?;', ( dump_type, ) ) }

            if dump_type == YAML_DUMP_ID_LOCAL_BOORU:

                result = { dump_name.decode( 'hex' ) : data for ( dump_name, data ) in result.items() }


        else:

            if dump_type == YAML_DUMP_ID_SUBSCRIPTION and dump_name in self._subscriptions_cache: return self._subscriptions_cache[ dump_name ]

            if dump_type == YAML_DUMP_ID_LOCAL_BOORU: dump_name = dump_name.encode( 'hex' )

            result = self._c.execute( 'SELECT dump FROM yaml_dumps WHERE dump_type = ? AND dump_name = ?;', ( dump_type, dump_name ) ).fetchone()

            if result is None:

                if result is None:

                    raise HydrusExceptions.DataMissing( dump_name + ' was not found!' )


            else: ( result, ) = result

            if dump_type == YAML_DUMP_ID_SUBSCRIPTION: self._subscriptions_cache[ dump_name ] = result


        return result


    def _GetYAMLDumpNames( self, dump_type ):

        names = [ name for ( name, ) in self._c.execute( 'SELECT dump_name FROM yaml_dumps WHERE dump_type = ?;', ( dump_type, ) ) ]

        if dump_type == YAML_DUMP_ID_LOCAL_BOORU:

            names = [ name.decode( 'hex' ) for name in names ]


        return names


    def _HashExists( self, hash ):

        result = self._c.execute( 'SELECT hash_id FROM hashes WHERE hash = ?;', ( sqlite3.Binary( hash ), ) ).fetchone()

        if result is None:

            return False

        else:

            return True


    def _ImportFile( self, temp_path, import_file_options = None, override_deleted = False, url = None ):

        if import_file_options is None:

            import_file_options = ClientDefaults.GetDefaultImportFileOptions()


        ( archive, exclude_deleted_files, min_size, min_resolution ) = import_file_options.ToTuple()

        HydrusImageHandling.ConvertToPngIfBmp( temp_path )

        hash = HydrusFileHandling.GetHashFromPath( temp_path )

        hash_id = self._GetHashId( hash )

        if url is not None:

            self._c.execute( 'INSERT OR IGNORE INTO urls ( url, hash_id ) VALUES ( ?, ? );', ( url, hash_id ) )


        ( status, status_hash ) = self._GetHashIdStatus( hash_id )

        if status == CC.STATUS_DELETED:

            if override_deleted or not exclude_deleted_files:

                status = CC.STATUS_NEW


        if status == CC.STATUS_REDUNDANT:

            if archive:

                self._ArchiveFiles( ( hash_id, ) )

                self.pub_content_updates_after_commit( { CC.COMBINED_LOCAL_FILE_SERVICE_KEY : [ HydrusData.ContentUpdate( HC.CONTENT_TYPE_FILES, HC.CONTENT_UPDATE_ARCHIVE, set( ( hash, ) ) ) ] } )


        elif status == CC.STATUS_NEW:

            mime = HydrusFileHandling.GetMime( temp_path )

            ( size, mime, width, height, duration, num_frames, num_words ) = HydrusFileHandling.GetFileInfo( temp_path )

            if width is not None and height is not None:

                if min_resolution is not None:

                    ( min_x, min_y ) = min_resolution

                    if width < min_x or height < min_y:

                        raise Exception( 'Resolution too small' )


            if min_size is not None:

                if size < min_size:

                    raise Exception( 'File too small' )


            timestamp = HydrusData.GetNow()

            client_files_manager = self._controller.GetClientFilesManager()

            if mime in HC.MIMES_WITH_THUMBNAILS:

                thumbnail = HydrusFileHandling.GenerateThumbnail( temp_path )

                # lockless because this db call is made by the locked client files manager
                client_files_manager.LocklessAddFullSizeThumbnail( hash, thumbnail )


            if mime in HC.MIMES_WE_CAN_PHASH:

                phashes = ClientImageHandling.GenerateShapePerceptualHashes( temp_path )

                self._CacheSimilarFilesAssociatePHashes( hash_id, phashes )


            # lockless because this db call is made by the locked client files manager
            client_files_manager.LocklessAddFile( hash, mime, temp_path )

            self._AddFilesInfo( [ ( hash_id, size, mime, width, height, duration, num_frames, num_words ) ], overwrite = True )

            self._AddFiles( self._local_file_service_id, [ ( hash_id, timestamp ) ] )

            content_update = HydrusData.ContentUpdate( HC.CONTENT_TYPE_FILES, HC.CONTENT_UPDATE_ADD, ( hash, size, mime, timestamp, width, height, duration, num_frames, num_words ) )

            self.pub_content_updates_after_commit( { CC.LOCAL_FILE_SERVICE_KEY : [ content_update ] } )

            ( md5, sha1, sha512 ) = HydrusFileHandling.GetExtraHashesFromPath( temp_path )

            self._c.execute( 'INSERT OR IGNORE INTO local_hashes ( hash_id, md5, sha1, sha512 ) VALUES ( ?, ?, ?, ? );', ( hash_id, sqlite3.Binary( md5 ), sqlite3.Binary( sha1 ), sqlite3.Binary( sha512 ) ) )

            if archive:

                self._ArchiveFiles( ( hash_id, ) )

            else:

                self._InboxFiles( ( hash_id, ) )


            status = CC.STATUS_SUCCESSFUL


        tag_services = self._GetServices( HC.TAG_SERVICES )

        for service in tag_services:

            service_key = service.GetServiceKey()
            info = service.GetInfo()

            tag_archive_sync = info[ 'tag_archive_sync' ]

            for ( portable_hta_path, namespaces ) in tag_archive_sync.items():

                hta_path = HydrusPaths.ConvertPortablePathToAbsPath( portable_hta_path )

                adding = True

                try: self._SyncHashesToTagArchive( [ hash ], hta_path, service_key, adding, namespaces )
                except: pass


        return ( status, hash )


    def _InboxFiles( self, hash_ids ):

        self._c.executemany( 'INSERT OR IGNORE INTO file_inbox VALUES ( ? );', ( ( hash_id, ) for hash_id in hash_ids ) )

        num_added = self._GetRowCount()

        if num_added > 0:

            splayed_hash_ids = HydrusData.SplayListForDB( hash_ids )

            updates = self._c.execute( 'SELECT service_id, COUNT( * ) FROM current_files WHERE hash_id IN ' + splayed_hash_ids + ' GROUP BY service_id;' ).fetchall()

            self._c.executemany( 'UPDATE service_info SET info = info + ? WHERE service_id = ? AND info_type = ?;', [ ( count, service_id, HC.SERVICE_INFO_NUM_INBOX ) for ( service_id, count ) in updates ] )

            self._inbox_hash_ids.update( hash_ids )


    def _InitCaches( self ):

        new_options = self._GetJSONDump( HydrusSerialisable.SERIALISABLE_TYPE_CLIENT_OPTIONS )

        disk_cache_init_period = new_options.GetNoneableInteger( 'disk_cache_init_period' )

        if disk_cache_init_period is not None:

            HydrusGlobals.client_controller.pub( 'splash_set_status_text', 'preparing disk cache' )

            stop_time = HydrusData.GetNow() + disk_cache_init_period

            self._LoadIntoDiskCache( stop_time = stop_time )


        HydrusGlobals.client_controller.pub( 'splash_set_status_text', 'preparing db caches' )

        self._local_file_service_id = self._GetServiceId( CC.LOCAL_FILE_SERVICE_KEY )
        self._trash_service_id = self._GetServiceId( CC.TRASH_SERVICE_KEY )
        self._combined_local_file_service_id = self._GetServiceId( CC.COMBINED_LOCAL_FILE_SERVICE_KEY )
        self._local_tag_service_id = self._GetServiceId( CC.LOCAL_TAG_SERVICE_KEY )
        self._combined_file_service_id = self._GetServiceId( CC.COMBINED_FILE_SERVICE_KEY )
        self._combined_tag_service_id = self._GetServiceId( CC.COMBINED_TAG_SERVICE_KEY )

        self._subscriptions_cache = {}
        self._service_cache = {}

        ( self._null_namespace_id, ) = self._c.execute( 'SELECT namespace_id FROM namespaces WHERE namespace = ?;', ( '', ) ).fetchone()

        self._inbox_hash_ids = { id for ( id, ) in self._c.execute( 'SELECT hash_id FROM file_inbox;' ) }


    def _InitExternalDatabases( self ):

        self._db_filenames[ 'external_caches' ] = 'client.caches.db'
        self._db_filenames[ 'external_mappings' ] = 'client.mappings.db'
        self._db_filenames[ 'external_master' ] = 'client.master.db'


    def _IsAnOrphan( self, test_type, possible_hash ):

        if self._HashExists( possible_hash ):

            hash = possible_hash

            if test_type == 'file':

                hash_id = self._GetHashId( hash )

                result = self._c.execute( 'SELECT 1 FROM current_files WHERE service_id = ? AND hash_id = ?;', ( self._combined_local_file_service_id, hash_id ) ).fetchone()

                if result is None:

                    return True

                else:

                    return False


            elif test_type == 'thumbnail':

                hash_id = self._GetHashId( hash )

                result = self._c.execute( 'SELECT 1 FROM current_files WHERE hash_id = ?;', ( hash_id, ) ).fetchone()

                if result is None:

                    return True

                else:

                    return False


        else:

            return True


    def _LoadIntoDiskCache( self, stop_time = None, caller_limit = None ):

        self._CloseDBCursor()

        try:

            approx_disk_cache_size = psutil.virtual_memory().available * 4 / 5

            disk_cache_limit = approx_disk_cache_size * 2 / 3

        except psutil.Error:

            disk_cache_limit = 512 * 1024 * 1024


        so_far_read = 0

        try:

            paths = [ os.path.join( self._db_dir, filename ) for filename in self._db_filenames.values() ]

            paths.sort( key = os.path.getsize )

            for path in paths:

                with open( path, 'rb' ) as f:

                    while f.read( HC.READ_BLOCK_SIZE ) != '':

                        if stop_time is not None and HydrusData.TimeHasPassed( stop_time ):

                            return False


                        so_far_read += HC.READ_BLOCK_SIZE

                        if so_far_read > disk_cache_limit:

                            return True


                        if caller_limit is not None and so_far_read > caller_limit:

                            return False


        finally:

            self._InitDBCursor()


        return True


    def _MaintenanceDue( self, stop_time ):

        # vacuum

        new_options = self._controller.GetNewOptions()

        maintenance_vacuum_period_days = new_options.GetNoneableInteger( 'maintenance_vacuum_period_days' )

        if maintenance_vacuum_period_days is not None:

            stale_time_delta = maintenance_vacuum_period_days * 86400

            existing_names_to_timestamps = dict( self._c.execute( 'SELECT name, timestamp FROM vacuum_timestamps;' ).fetchall() )

            db_names = [ name for ( index, name, path ) in self._c.execute( 'PRAGMA database_list;' ) if name not in ( 'mem', 'temp' ) ]

            due_names = { name for name in db_names if name not in existing_names_to_timestamps or HydrusData.TimeHasPassed( existing_names_to_timestamps[ name ] + stale_time_delta ) }

            possible_due_names = set()

            if len( due_names ) > 0:

                self._CloseDBCursor()

                try:

                    for name in due_names:

                        db_path = os.path.join( self._db_dir, self._db_filenames[ name ] )

                        if HydrusDB.CanVacuum( db_path, stop_time = stop_time ):

                            possible_due_names.add( name )


                    if len( possible_due_names ) > 0:

                        return True


                finally:

                    self._InitDBCursor()


        # analyze

        names_to_analyze = self._GetBigTableNamesToAnalyze()

        if len( names_to_analyze ) > 0:

            return True


        return self._CacheSimilarFilesMaintenanceDue()


    def _ManageDBError( self, job, e ):

        if isinstance( e, MemoryError ):

            HydrusData.ShowText( 'The client is running out of memory! Restart it ASAP!' )


        if job.IsSynchronous():

            db_traceback = 'Database ' + traceback.format_exc()

            first_line = HydrusData.ToUnicode( type( e ).__name__ ) + ': ' + HydrusData.ToUnicode( e )

            new_e = HydrusExceptions.DBException( first_line, db_traceback )

            job.PutResult( new_e )

        else:

            HydrusData.ShowException( e )


    def _OverwriteJSONDumps( self, dump_types, objs ):

        for dump_type in dump_types:

            self._DeleteJSONDumpNamed( dump_type )


        for obj in objs:

            self._SetJSONDump( obj )


    def _ProcessContentUpdatePackage( self, service_key, content_update_package, job_key ):

        ( previous_journal_mode, ) = self._c.execute( 'PRAGMA journal_mode;' ).fetchone()

        if previous_journal_mode == 'wal' and not self._fast_big_transaction_wal:

            self._c.execute( 'COMMIT;' )

            self._c.execute( 'PRAGMA journal_mode = TRUNCATE;' )

            self._c.execute( 'BEGIN IMMEDIATE;' )


        c_u_p_num_rows = content_update_package.GetNumRows()
        c_u_p_total_weight_processed = 0

        update_speed_string = u'writing\u2026'

        content_update_index_string = 'content row ' + HydrusData.ConvertValueRangeToPrettyString( c_u_p_total_weight_processed, c_u_p_num_rows ) + ': '

        quit_early = False

        package_precise_timestamp = HydrusData.GetNowPrecise()

        for ( content_updates, weight ) in content_update_package.IterateContentUpdateChunks():

            options = self._controller.GetOptions()

            if options[ 'pause_repo_sync' ]:

                quit_early = True


            ( i_paused, should_quit ) = job_key.WaitIfNeeded()

            if should_quit:

                quit_early = True


            if quit_early:

                package_took = HydrusData.GetNowPrecise() - package_precise_timestamp

                rows_s = c_u_p_total_weight_processed / package_took

                committing_string = 'wrote ' + HydrusData.ConvertIntToPrettyString( c_u_p_num_rows ) + ' rows at ' + HydrusData.ConvertIntToPrettyString( rows_s ) + ' rows/s - now committing to disk'

                job_key.SetVariable( 'popup_text_2', committing_string )

                HydrusData.Print( job_key.ToString() )

                if previous_journal_mode == 'wal' and not self._fast_big_transaction_wal:

                    self._c.execute( 'COMMIT;' )

                    self._c.execute( 'PRAGMA journal_mode = WAL;' )

                    self._c.execute( 'BEGIN IMMEDIATE;' )


                return ( False, c_u_p_total_weight_processed )


            content_update_index_string = 'content row ' + HydrusData.ConvertValueRangeToPrettyString( c_u_p_total_weight_processed, c_u_p_num_rows ) + ': '

            self._controller.pub( 'splash_set_status_text', content_update_index_string + update_speed_string, print_to_log = False )
            job_key.SetVariable( 'popup_text_2', content_update_index_string + update_speed_string )

            job_key.SetVariable( 'popup_gauge_2', ( c_u_p_total_weight_processed, c_u_p_num_rows ) )

            chunk_precise_timestamp = HydrusData.GetNowPrecise()

            self._ProcessContentUpdates( { service_key : content_updates }, do_pubsubs = False )

            chunk_took = HydrusData.GetNowPrecise() - chunk_precise_timestamp

            rows_s = weight / chunk_took

            update_speed_string = 'writing at ' + HydrusData.ConvertIntToPrettyString( rows_s ) + ' rows/s'

            c_u_p_total_weight_processed += weight


        package_took = HydrusData.GetNowPrecise() - package_precise_timestamp

        rows_s = c_u_p_total_weight_processed / package_took

        committing_string = 'wrote ' + HydrusData.ConvertIntToPrettyString( c_u_p_num_rows ) + ' rows at ' + HydrusData.ConvertIntToPrettyString( rows_s ) + ' rows/s - now committing to disk'

        self._controller.pub( 'splash_set_status_text', committing_string )
        job_key.SetVariable( 'popup_text_2', committing_string )

        job_key.SetVariable( 'popup_gauge_2', ( c_u_p_num_rows, c_u_p_num_rows ) )

        HydrusData.Print( job_key.ToString() )

        if previous_journal_mode == 'wal' and not self._fast_big_transaction_wal:

            self._c.execute( 'COMMIT;' )

            self._c.execute( 'PRAGMA journal_mode = WAL;' )

            self._c.execute( 'BEGIN IMMEDIATE;' )


        return ( True, c_u_p_total_weight_processed )


    def _ProcessContentUpdates( self, service_keys_to_content_updates, do_pubsubs = True ):

        notify_new_downloads = False
        notify_new_pending = False
        notify_new_parents = False
        notify_new_siblings = False

        for ( service_key, content_updates ) in service_keys_to_content_updates.items():

            try:

                service_id = self._GetServiceId( service_key )

            except HydrusExceptions.DataMissing:

                continue


            service = self._GetService( service_id )

            service_type = service.GetServiceType()

            ultimate_mappings_ids = []
            ultimate_deleted_mappings_ids = []

            ultimate_pending_mappings_ids = []
            ultimate_pending_rescinded_mappings_ids = []

            ultimate_petitioned_mappings_ids = []
            ultimate_petitioned_rescinded_mappings_ids = []

            for content_update in content_updates:

                ( data_type, action, row ) = content_update.ToTuple()

                if service_type in HC.FILE_SERVICES:

                    if data_type == HC.CONTENT_TYPE_FILES:

                        if action == HC.CONTENT_UPDATE_ADVANCED:

                            ( sub_action, sub_row ) = row

                            if sub_action == 'delete_deleted':

                                self._c.execute( 'DELETE FROM deleted_files WHERE service_id = ?;', ( service_id, ) )


                            self._c.execute( 'DELETE FROM service_info WHERE service_id = ?;', ( service_id, ) )

                        elif action == HC.CONTENT_UPDATE_ADD:

                            if service_type in HC.LOCAL_FILE_SERVICES or service_type == HC.FILE_REPOSITORY:

                                ( hash, size, mime, timestamp, width, height, duration, num_frames, num_words ) = row

                                hash_id = self._GetHashId( hash )

                                self._AddFilesInfo( [ ( hash_id, size, mime, width, height, duration, num_frames, num_words ) ] )

                            elif service_type == HC.IPFS:

                                ( hash, multihash ) = row

                                hash_id = self._GetHashId( hash )

                                self._SetServiceFilename( service_id, hash_id, multihash )

                                timestamp = HydrusData.GetNow()


                            self._AddFiles( service_id, [ ( hash_id, timestamp ) ] )

                        elif action == HC.CONTENT_UPDATE_PEND:

                            hashes = row

                            hash_ids = self._GetHashIds( hashes )

                            self._c.executemany( 'INSERT OR IGNORE INTO file_transfers ( service_id, hash_id ) VALUES ( ?, ? );', [ ( service_id, hash_id ) for hash_id in hash_ids ] )

                            if service_key == CC.COMBINED_LOCAL_FILE_SERVICE_KEY: notify_new_downloads = True
                            else: notify_new_pending = True

                        elif action == HC.CONTENT_UPDATE_PETITION:

                            ( hashes, reason ) = row

                            hash_ids = self._GetHashIds( hashes )

                            reason_id = self._GetTextId( reason )

                            self._c.execute( 'DELETE FROM file_petitions WHERE service_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( service_id, ) )

                            self._c.executemany( 'INSERT OR IGNORE INTO file_petitions ( service_id, hash_id, reason_id ) VALUES ( ?, ?, ? );', [ ( service_id, hash_id, reason_id ) for hash_id in hash_ids ] )

                            notify_new_pending = True

                        elif action == HC.CONTENT_UPDATE_RESCIND_PEND:

                            hashes = row

                            hash_ids = self._GetHashIds( hashes )

                            self._c.execute( 'DELETE FROM file_transfers WHERE service_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( service_id, ) )

                            notify_new_pending = True

                        elif action == HC.CONTENT_UPDATE_RESCIND_PETITION:

                            hashes = row

                            hash_ids = self._GetHashIds( hashes )

                            self._c.execute( 'DELETE FROM file_petitions WHERE service_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( service_id, ) )

                            notify_new_pending = True

                        else:

                            hashes = row

                            hash_ids = self._GetHashIds( hashes )

                            if action == HC.CONTENT_UPDATE_ARCHIVE: self._ArchiveFiles( hash_ids )
                            elif action == HC.CONTENT_UPDATE_INBOX: self._InboxFiles( hash_ids )
                            elif action == HC.CONTENT_UPDATE_DELETE:

                                deleted_hash_ids = self._DeleteFiles( service_id, hash_ids )

                                if service_id == self._trash_service_id:

                                    self._DeleteFiles( self._combined_local_file_service_id, deleted_hash_ids )


                            elif action == HC.CONTENT_UPDATE_UNDELETE:

                                splayed_hash_ids = HydrusData.SplayListForDB( hash_ids )

                                rows = self._c.execute( 'SELECT hash_id, timestamp FROM current_files WHERE service_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( self._combined_local_file_service_id, ) ).fetchall()

                                self._AddFiles( self._local_file_service_id, rows )


                    elif data_type == HC.CONTENT_TYPE_DIRECTORIES:

                        if action == HC.CONTENT_UPDATE_ADD:

                            ( hashes, dirname, note ) = row

                            hash_ids = self._GetHashIds( hashes )

                            self._SetServiceDirectory( service_id, hash_ids, dirname, note )

                        elif action == HC.CONTENT_UPDATE_DELETE:

                            dirname = row

                            self._DeleteServiceDirectory( service_id, dirname )


                elif service_type in HC.TAG_SERVICES:

                    if data_type == HC.CONTENT_TYPE_MAPPINGS:

                        if action == HC.CONTENT_UPDATE_ADVANCED:

                            ( sub_action, sub_row ) = row

                            if sub_action in ( 'copy', 'delete', 'delete_deleted' ):

                                self._c.execute( 'CREATE TEMPORARY TABLE temp_operation ( job_id INTEGER PRIMARY KEY AUTOINCREMENT, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER );' )

                                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

                                if sub_action == 'copy':

                                    ( tag, hashes, service_key_target ) = sub_row

                                    source_table_name = current_mappings_table_name

                                elif sub_action == 'delete':

                                    ( tag, hashes ) = sub_row

                                    source_table_name = current_mappings_table_name

                                elif sub_action == 'delete_deleted':

                                    ( tag, hashes ) = sub_row

                                    source_table_name = deleted_mappings_table_name


                                predicates = []

                                if tag is not None:

                                    ( tag_type, tag ) = tag

                                    if tag_type == 'tag':

                                        try: ( namespace_id, tag_id ) = self._GetNamespaceIdTagId( tag )
                                        except HydrusExceptions.SizeException: continue

                                        predicates.append( 'namespace_id = ' + str( namespace_id ) )
                                        predicates.append( 'tag_id = ' + str( tag_id ) )

                                    elif tag_type == 'namespace':

                                        namespace_id = self._GetNamespaceId( tag )

                                        predicates.append( 'namespace_id = ' + str( namespace_id ) )

                                    elif tag_type == 'namespaced':

                                        predicates.append( 'namespace_id != ' + str( self._null_namespace_id ) )

                                    elif tag_type == 'unnamespaced':

                                        predicates.append( 'namespace_id = ' + str( self._null_namespace_id ) )


                                if hashes is not None:

                                    hash_ids = self._GetHashIds( hashes )

                                    predicates.append( 'hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) )


                                if len( predicates ) == 0:

                                    self._c.execute( 'INSERT INTO temp_operation ( namespace_id, tag_id, hash_id ) SELECT namespace_id, tag_id, hash_id FROM ' + source_table_name + ';' )

                                else:

                                    self._c.execute( 'INSERT INTO temp_operation ( namespace_id, tag_id, hash_id ) SELECT namespace_id, tag_id, hash_id FROM ' + source_table_name + ' WHERE ' + ' AND '.join( predicates ) + ';' )


                                num_to_do = self._GetRowCount()

                                i = 0

                                block_size = 1000

                                while i < num_to_do:

                                    advanced_mappings_ids = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM temp_operation WHERE job_id BETWEEN ? AND ?;', ( i, i + block_size - 1 ) )

                                    advanced_mappings_ids = HydrusData.BuildKeyToListDict( ( ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in advanced_mappings_ids ) )

                                    advanced_mappings_ids = [ ( namespace_id, tag_id, hash_ids ) for ( ( namespace_id, tag_id ), hash_ids ) in advanced_mappings_ids.items() ]

                                    if sub_action == 'copy':

                                        service_id_target = self._GetServiceId( service_key_target )

                                        service_target = self._GetService( service_id_target )

                                        if service_target.GetServiceType() == HC.LOCAL_TAG: kwarg = 'mappings_ids'
                                        else: kwarg = 'pending_mappings_ids'

                                        kwargs = { kwarg : advanced_mappings_ids }

                                        self._UpdateMappings( service_id_target, **kwargs )

                                    elif sub_action == 'delete':

                                        self._UpdateMappings( service_id, deleted_mappings_ids = advanced_mappings_ids )

                                    elif sub_action == 'delete_deleted':

                                        for ( namespace_id, tag_id, hash_ids ) in advanced_mappings_ids:

                                            self._c.execute( 'DELETE FROM ' + deleted_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( namespace_id, tag_id ) )


                                        self._c.execute( 'DELETE FROM service_info WHERE service_id = ?;', ( service_id, ) )


                                    i += block_size


                                self._c.execute( 'DROP TABLE temp_operation;' )

                                self.pub_after_commit( 'notify_new_pending' )


                        else:

                            if action == HC.CONTENT_UPDATE_PETITION: ( tag, hashes, reason ) = row
                            else: ( tag, hashes ) = row

                            try: ( namespace_id, tag_id ) = self._GetNamespaceIdTagId( tag )
                            except HydrusExceptions.SizeException: continue

                            hash_ids = self._GetHashIds( hashes )

                            if action == HC.CONTENT_UPDATE_ADD: ultimate_mappings_ids.append( ( namespace_id, tag_id, hash_ids ) )
                            elif action == HC.CONTENT_UPDATE_DELETE: ultimate_deleted_mappings_ids.append( ( namespace_id, tag_id, hash_ids ) )
                            elif action == HC.CONTENT_UPDATE_PEND: ultimate_pending_mappings_ids.append( ( namespace_id, tag_id, hash_ids ) )
                            elif action == HC.CONTENT_UPDATE_RESCIND_PEND: ultimate_pending_rescinded_mappings_ids.append( ( namespace_id, tag_id, hash_ids ) )
                            elif action == HC.CONTENT_UPDATE_PETITION:

                                reason_id = self._GetTextId( reason )

                                ultimate_petitioned_mappings_ids.append( ( namespace_id, tag_id, hash_ids, reason_id ) )

                            elif action == HC.CONTENT_UPDATE_RESCIND_PETITION: ultimate_petitioned_rescinded_mappings_ids.append( ( namespace_id, tag_id, hash_ids ) )


                    elif data_type == HC.CONTENT_TYPE_TAG_SIBLINGS:

                        if action in ( HC.CONTENT_UPDATE_ADD, HC.CONTENT_UPDATE_DELETE ):

                            if action == HC.CONTENT_UPDATE_ADD: ( deletee_status, new_status ) = ( HC.PENDING, HC.CURRENT )
                            elif action == HC.CONTENT_UPDATE_DELETE: ( deletee_status, new_status ) = ( HC.PETITIONED, HC.DELETED )

                            ( old_tag, new_tag ) = row

                            try:

                                ( old_namespace_id, old_tag_id ) = self._GetNamespaceIdTagId( old_tag )

                                ( new_namespace_id, new_tag_id ) = self._GetNamespaceIdTagId( new_tag )

                            except HydrusExceptions.SizeException:

                                continue


                            self._c.execute( 'DELETE FROM tag_siblings WHERE service_id = ? AND old_namespace_id = ? AND old_tag_id = ?;', ( service_id, old_namespace_id, old_tag_id ) )
                            self._c.execute( 'DELETE FROM tag_sibling_petitions WHERE service_id = ? AND old_namespace_id = ? AND old_tag_id = ? AND status = ?;', ( service_id, old_namespace_id, old_tag_id, deletee_status ) )

                            self._c.execute( 'INSERT OR IGNORE INTO tag_siblings ( service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, status ) VALUES ( ?, ?, ?, ?, ?, ? );', ( service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, new_status ) )

                        elif action in ( HC.CONTENT_UPDATE_PEND, HC.CONTENT_UPDATE_PETITION ):

                            if action == HC.CONTENT_UPDATE_PEND: new_status = HC.PENDING
                            elif action == HC.CONTENT_UPDATE_PETITION: new_status = HC.PETITIONED

                            ( ( old_tag, new_tag ), reason ) = row

                            try:

                                ( old_namespace_id, old_tag_id ) = self._GetNamespaceIdTagId( old_tag )

                                ( new_namespace_id, new_tag_id ) = self._GetNamespaceIdTagId( new_tag )

                            except HydrusExceptions.SizeException:

                                continue


                            reason_id = self._GetTextId( reason )

                            self._c.execute( 'DELETE FROM tag_sibling_petitions WHERE service_id = ? AND old_namespace_id = ? AND old_tag_id = ?;', ( service_id, old_namespace_id, old_tag_id ) )

                            self._c.execute( 'INSERT OR IGNORE INTO tag_sibling_petitions ( service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, reason_id, status ) VALUES ( ?, ?, ?, ?, ?, ?, ? );', ( service_id, old_namespace_id, old_tag_id, new_namespace_id, new_tag_id, reason_id, new_status ) )

                            notify_new_pending = True

                        elif action in ( HC.CONTENT_UPDATE_RESCIND_PEND, HC.CONTENT_UPDATE_RESCIND_PETITION ):

                            if action == HC.CONTENT_UPDATE_RESCIND_PEND:

                                deletee_status = HC.PENDING

                            elif action == HC.CONTENT_UPDATE_RESCIND_PETITION:

                                deletee_status = HC.PETITIONED


                            ( old_tag, new_tag ) = row

                            try:

                                ( old_namespace_id, old_tag_id ) = self._GetNamespaceIdTagId( old_tag )

                            except HydrusExceptions.SizeException:

                                continue


                            self._c.execute( 'DELETE FROM tag_sibling_petitions WHERE service_id = ? AND old_namespace_id = ? AND old_tag_id = ? AND status = ?;', ( service_id, old_namespace_id, old_tag_id, deletee_status ) )

                            notify_new_pending = True


                        notify_new_siblings = True

                    elif data_type == HC.CONTENT_TYPE_TAG_PARENTS:

                        if action in ( HC.CONTENT_UPDATE_ADD, HC.CONTENT_UPDATE_DELETE ):

                            if action == HC.CONTENT_UPDATE_ADD: ( deletee_status, new_status ) = ( HC.PENDING, HC.CURRENT )
                            elif action == HC.CONTENT_UPDATE_DELETE: ( deletee_status, new_status ) = ( HC.PETITIONED, HC.DELETED )

                            ( child_tag, parent_tag ) = row

                            try:

                                ( child_namespace_id, child_tag_id ) = self._GetNamespaceIdTagId( child_tag )

                                ( parent_namespace_id, parent_tag_id ) = self._GetNamespaceIdTagId( parent_tag )

                            except HydrusExceptions.SizeException: continue

                            self._c.execute( 'DELETE FROM tag_parents WHERE service_id = ? AND child_namespace_id = ? AND child_tag_id = ? AND parent_namespace_id = ? AND parent_tag_id = ?;', ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id ) )
                            self._c.execute( 'DELETE FROM tag_parent_petitions WHERE service_id = ? AND child_namespace_id = ? AND child_tag_id = ? AND parent_namespace_id = ? AND parent_tag_id = ? AND status = ?;', ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, deletee_status ) )

                            self._c.execute( 'INSERT OR IGNORE INTO tag_parents ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, status ) VALUES ( ?, ?, ?, ?, ?, ? );', ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, new_status ) )

                            if action == HC.CONTENT_UPDATE_ADD:

                                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

                                existing_hash_ids = [ hash for ( hash, ) in self._c.execute( 'SELECT hash_id FROM ' + current_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ?;', ( child_namespace_id, child_tag_id ) ) ]

                                existing_hashes = self._GetHashes( existing_hash_ids )

                                mappings_ids = [ ( parent_namespace_id, parent_tag_id, existing_hash_ids ) ]

                                self._UpdateMappings( service_id, mappings_ids = mappings_ids )

                                special_content_update = HydrusData.ContentUpdate( HC.CONTENT_TYPE_MAPPINGS, HC.CONTENT_UPDATE_ADD, ( parent_tag, existing_hashes ) )

                                self.pub_content_updates_after_commit( { service_key : [ special_content_update ] } )


                        elif action in ( HC.CONTENT_UPDATE_PEND, HC.CONTENT_UPDATE_PETITION ):

                            if action == HC.CONTENT_UPDATE_PEND: new_status = HC.PENDING
                            elif action == HC.CONTENT_UPDATE_PETITION: new_status = HC.PETITIONED

                            ( ( child_tag, parent_tag ), reason ) = row

                            try:

                                ( child_namespace_id, child_tag_id ) = self._GetNamespaceIdTagId( child_tag )

                                ( parent_namespace_id, parent_tag_id ) = self._GetNamespaceIdTagId( parent_tag )

                            except HydrusExceptions.SizeException: continue

                            reason_id = self._GetTextId( reason )

                            self._c.execute( 'DELETE FROM tag_parent_petitions WHERE service_id = ? AND child_namespace_id = ? AND child_tag_id = ? AND parent_namespace_id = ? AND parent_tag_id = ?;', ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id ) )

                            self._c.execute( 'INSERT OR IGNORE INTO tag_parent_petitions ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, reason_id, status ) VALUES ( ?, ?, ?, ?, ?, ?, ? );', ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, reason_id, new_status ) )

                            notify_new_pending = True

                        elif action in ( HC.CONTENT_UPDATE_RESCIND_PEND, HC.CONTENT_UPDATE_RESCIND_PETITION ):

                            if action == HC.CONTENT_UPDATE_RESCIND_PEND: deletee_status = HC.PENDING
                            elif action == HC.CONTENT_UPDATE_RESCIND_PETITION: deletee_status = HC.PETITIONED

                            ( child_tag, parent_tag ) = row

                            try:

                                ( child_namespace_id, child_tag_id ) = self._GetNamespaceIdTagId( child_tag )

                                ( parent_namespace_id, parent_tag_id ) = self._GetNamespaceIdTagId( parent_tag )

                            except HydrusExceptions.SizeException: continue

                            self._c.execute( 'DELETE FROM tag_parent_petitions WHERE service_id = ? AND child_namespace_id = ? AND child_tag_id = ? AND parent_namespace_id = ? AND parent_tag_id = ? AND status = ?;', ( service_id, child_namespace_id, child_tag_id, parent_namespace_id, parent_tag_id, deletee_status ) )

                            notify_new_pending = True


                        notify_new_parents = True


                elif service_type in HC.RATINGS_SERVICES:

                    if action == HC.CONTENT_UPDATE_ADD:

                        ( rating, hashes ) = row

                        hash_ids = self._GetHashIds( hashes )

                        splayed_hash_ids = HydrusData.SplayListForDB( hash_ids )

                        if service_type in ( HC.LOCAL_RATING_LIKE, HC.LOCAL_RATING_NUMERICAL ):

                            ratings_added = 0

                            self._c.execute( 'DELETE FROM local_ratings WHERE service_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( service_id, ) )

                            ratings_added -= self._GetRowCount()

                            if rating is not None:

                                self._c.executemany( 'INSERT INTO local_ratings ( service_id, hash_id, rating ) VALUES ( ?, ?, ? );', [ ( service_id, hash_id, rating ) for hash_id in hash_ids ] )

                                ratings_added += self._GetRowCount()


                            self._c.execute( 'UPDATE service_info SET info = info + ? WHERE service_id = ? AND info_type = ?;', ( ratings_added, service_id, HC.SERVICE_INFO_NUM_FILES ) )

                            # and then do a thing here where it looks up remote services links and then pends/rescinds pends appropriately


            if len( ultimate_mappings_ids ) + len( ultimate_deleted_mappings_ids ) + len( ultimate_pending_mappings_ids ) + len( ultimate_pending_rescinded_mappings_ids ) + len( ultimate_petitioned_mappings_ids ) + len( ultimate_petitioned_rescinded_mappings_ids ) > 0:

                self._UpdateMappings( service_id, mappings_ids = ultimate_mappings_ids, deleted_mappings_ids = ultimate_deleted_mappings_ids, pending_mappings_ids = ultimate_pending_mappings_ids, pending_rescinded_mappings_ids = ultimate_pending_rescinded_mappings_ids, petitioned_mappings_ids = ultimate_petitioned_mappings_ids, petitioned_rescinded_mappings_ids = ultimate_petitioned_rescinded_mappings_ids )

                notify_new_pending = True


        if do_pubsubs:

            if notify_new_downloads:

                self.pub_after_commit( 'notify_new_downloads' )

            if notify_new_pending:

                self.pub_after_commit( 'notify_new_pending' )

            if notify_new_siblings:

                self.pub_after_commit( 'notify_new_siblings_data' )
                self.pub_after_commit( 'notify_new_siblings_gui' )
                self.pub_after_commit( 'notify_new_parents' )

            elif notify_new_parents:

                self.pub_after_commit( 'notify_new_parents' )


            self.pub_content_updates_after_commit( service_keys_to_content_updates )


    def _ProcessServiceUpdates( self, service_keys_to_service_updates ):

        do_new_permissions = False

        hydrus_requests_made = []
        local_booru_requests_made = []

        for ( service_key, service_updates ) in service_keys_to_service_updates.items():

            try:

                service_id = self._GetServiceId( service_key )

            except HydrusExceptions.DataMissing:

                continue


            if service_id in self._service_cache: del self._service_cache[ service_id ]

            service = self._GetService( service_id )

            ( service_key, service_type, name, info ) = service.ToTuple()

            for service_update in service_updates:

                ( action, row ) = service_update.ToTuple()

                if action == HC.SERVICE_UPDATE_ACCOUNT:

                    account = row

                    update = { 'account' : account, 'last_error' : 0 }

                    self._UpdateServiceInfo( service_id, update )

                    do_new_permissions = True

                elif action == HC.SERVICE_UPDATE_ERROR:

                    update = { 'last_error' : HydrusData.GetNow() }

                    self._UpdateServiceInfo( service_id, update )

                elif action == HC.SERVICE_UPDATE_REQUEST_MADE:

                    num_bytes = row

                    if service_type == HC.LOCAL_BOORU: local_booru_requests_made.append( num_bytes )
                    else: hydrus_requests_made.append( ( service_id, num_bytes ) )

                elif action == HC.SERVICE_UPDATE_NEWS:

                    news_rows = row

                    self._c.executemany( 'INSERT OR IGNORE INTO news VALUES ( ?, ?, ? );', [ ( service_id, post, timestamp ) for ( post, timestamp ) in news_rows ] )

                    now = HydrusData.GetNow()

                    for ( post, timestamp ) in news_rows:

                        if not HydrusData.TimeHasPassed( timestamp + 86400 * 7 ):

                            text = name + ' at ' + time.ctime( timestamp ) + ':' + os.linesep * 2 + post

                            job_key = ClientThreading.JobKey()

                            job_key.SetVariable( 'popup_text_1', text )

                            self.pub_after_commit( 'message', job_key )


                elif action == HC.SERVICE_UPDATE_NEXT_DOWNLOAD_TIMESTAMP:

                    next_download_timestamp = row

                    if next_download_timestamp > info[ 'next_download_timestamp' ]:

                        if info[ 'first_timestamp' ] is None: update = { 'first_timestamp' : next_download_timestamp, 'next_download_timestamp' : next_download_timestamp }
                        else: update = { 'next_download_timestamp' : next_download_timestamp }

                        self._UpdateServiceInfo( service_id, update )


                elif action == HC.SERVICE_UPDATE_NEXT_PROCESSING_TIMESTAMP:

                    next_processing_timestamp = row

                    if next_processing_timestamp > info[ 'next_processing_timestamp' ]:

                        info_update = { 'next_processing_timestamp' : next_processing_timestamp }

                        self._UpdateServiceInfo( service_id, info_update )


                elif action == HC.SERVICE_UPDATE_PAUSE:

                    info_update = { 'paused' : True }

                    self._UpdateServiceInfo( service_id, info_update )


            self.pub_service_updates_after_commit( service_keys_to_service_updates )


        for ( service_id, nums_bytes ) in HydrusData.BuildKeyToListDict( hydrus_requests_made ).items():

            service = self._GetService( service_id )

            info = service.GetInfo()

            account = info[ 'account' ]

            for num_bytes in nums_bytes: account.RequestMade( num_bytes )

            self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


        if len( local_booru_requests_made ) > 0:

            service_id = self._GetServiceId( CC.LOCAL_BOORU_SERVICE_KEY )

            service = self._GetService( service_id )

            info = service.GetInfo()

            info[ 'used_monthly_data' ] += sum( local_booru_requests_made )
            info[ 'used_monthly_requests' ] += len( local_booru_requests_made )

            self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


        if do_new_permissions: self.pub_after_commit( 'notify_new_permissions' )


    def _PushRecentTags( self, service_key, tags ):

        service_id = self._GetServiceId( service_key )

        if tags is None:

            self._c.execute( 'DELETE FROM recent_tags WHERE service_id = ?;', ( service_id, ) )

        else:

            now = HydrusData.GetNow()

            tag_ids = [ self._GetNamespaceIdTagId( tag ) for tag in tags ]

            self._c.executemany( 'REPLACE INTO recent_tags ( service_id, namespace_id, tag_id, timestamp ) VALUES ( ?, ?, ?, ? );', ( ( service_id, namespace_id, tag_id, now ) for ( namespace_id, tag_id ) in tag_ids ) )


    def _Read( self, action, *args, **kwargs ):

        if action == 'autocomplete_predicates': result = self._GetAutocompletePredicates( *args, **kwargs )
        elif action == 'client_files_locations': result = self._GetClientFilesLocations( *args, **kwargs )
        elif action == 'downloads': result = self._GetDownloads( *args, **kwargs )
        elif action == 'file_hashes': result = self._GetFileHashes( *args, **kwargs )
        elif action == 'file_query_ids': result = self._GetHashIdsFromQuery( *args, **kwargs )
        elif action == 'file_system_predicates': result = self._GetFileSystemPredicates( *args, **kwargs )
        elif action == 'filter_hashes': result = self._FilterHashes( *args, **kwargs )
        elif action == 'hydrus_sessions': result = self._GetHydrusSessions( *args, **kwargs )
        elif action == 'imageboards': result = self._GetYAMLDump( YAML_DUMP_ID_IMAGEBOARD, *args, **kwargs )
        elif action == 'is_an_orphan': result = self._IsAnOrphan( *args, **kwargs )
        elif action == 'known_urls': result = self._GetKnownURLs( *args, **kwargs )
        elif action == 'load_into_disk_cache': result = self._LoadIntoDiskCache( *args, **kwargs )
        elif action == 'local_booru_share_keys': result = self._GetYAMLDumpNames( YAML_DUMP_ID_LOCAL_BOORU )
        elif action == 'local_booru_share': result = self._GetYAMLDump( YAML_DUMP_ID_LOCAL_BOORU, *args, **kwargs )
        elif action == 'local_booru_shares': result = self._GetYAMLDump( YAML_DUMP_ID_LOCAL_BOORU )
        elif action == 'maintenance_due': result = self._MaintenanceDue( *args, **kwargs )
        elif action == 'md5_status': result = self._GetMD5Status( *args, **kwargs )
        elif action == 'media_results': result = self._GetMediaResultsFromHashes( *args, **kwargs )
        elif action == 'media_results_from_ids': result = self._GetMediaResults( *args, **kwargs )
        elif action == 'news': result = self._GetNews( *args, **kwargs )
        elif action == 'nums_pending': result = self._GetNumsPending( *args, **kwargs )
        elif action == 'trash_hashes': result = self._GetTrashHashes( *args, **kwargs )
        elif action == 'options': result = self._GetOptions( *args, **kwargs )
        elif action == 'pending': result = self._GetPending( *args, **kwargs )
        elif action == 'recent_tags': result = self._GetRecentTags( *args, **kwargs )
        elif action == 'remote_booru': result = self._GetYAMLDump( YAML_DUMP_ID_REMOTE_BOORU, *args, **kwargs )
        elif action == 'remote_boorus': result = self._GetYAMLDump( YAML_DUMP_ID_REMOTE_BOORU )
        elif action == 'serialisable': result = self._GetJSONDump( *args, **kwargs )
        elif action == 'serialisable_simple': result = self._GetJSONSimple( *args, **kwargs )
        elif action == 'serialisable_named': result = self._GetJSONDumpNamed( *args, **kwargs )
        elif action == 'serialisable_names': result = self._GetJSONDumpNames( *args, **kwargs )
        elif action == 'service_directory': result = self._GetServiceDirectoryHashes( *args, **kwargs )
        elif action == 'service_directories': result = self._GetServiceDirectoriesInfo( *args, **kwargs )
        elif action == 'service_filenames': result = self._GetServiceFilenames( *args, **kwargs )
        elif action == 'service_info': result = self._GetServiceInfo( *args, **kwargs )
        elif action == 'services': result = self._GetServices( *args, **kwargs )
        elif action == 'similar_files_maintenance_status': result = self._CacheSimilarFilesGetMaintenanceStatus( *args, **kwargs )
        elif action == 'related_tags': result = self._GetRelatedTags( *args, **kwargs )
        elif action == 'tag_censorship': result = self._GetTagCensorship( *args, **kwargs )
        elif action == 'tag_parents': result = self._GetTagParents( *args, **kwargs )
        elif action == 'tag_siblings': result = self._GetTagSiblings( *args, **kwargs )
        elif action == 'remote_thumbnail_hashes_i_should_have': result = self._GetRemoteThumbnailHashesIShouldHave( *args, **kwargs )
        elif action == 'url_status': result = self._GetURLStatus( *args, **kwargs )
        elif action == 'web_sessions': result = self._GetWebSessions( *args, **kwargs )
        else: raise Exception( 'db received an unknown read command: ' + action )

        return result


    def _RelocateClientFiles( self, prefix, source, dest ):

        full_source = os.path.join( source, prefix )
        full_dest = os.path.join( dest, prefix )

        if os.path.exists( full_source ):

            HydrusPaths.MergeTree( full_source, full_dest )

        elif not os.path.exists( full_dest ):

            HydrusPaths.MakeSureDirectoryExists( full_dest )


        portable_dest = HydrusPaths.ConvertAbsPathToPortablePath( dest )

        self._c.execute( 'UPDATE client_files_locations SET location = ? WHERE prefix = ?;', ( portable_dest, prefix ) )

        if os.path.exists( full_source ):

            try: HydrusPaths.RecyclePath( full_source )
            except: pass


    def _RegenerateACCache( self ):

        job_key = ClientThreading.JobKey()

        job_key.SetVariable( 'popup_title', 'regenerating autocomplete cache' )

        self._controller.pub( 'message', job_key )

        tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )
        file_service_ids = self._GetServiceIds( HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES )

        for ( file_service_id, tag_service_id ) in itertools.product( file_service_ids, tag_service_ids ):

            job_key.SetVariable( 'popup_text_1', 'generating specific ac_cache ' + str( file_service_id ) + '_' + str( tag_service_id ) )

            self._CacheSpecificMappingsDrop( file_service_id, tag_service_id )

            self._CacheSpecificMappingsGenerate( file_service_id, tag_service_id )


        for tag_service_id in tag_service_ids:

            job_key.SetVariable( 'popup_text_1', 'generating combined files ac_cache ' + str( tag_service_id ) )

            self._CacheCombinedFilesMappingsDrop( tag_service_id )

            self._CacheCombinedFilesMappingsGenerate( tag_service_id )


        job_key.SetVariable( 'popup_text_1', 'done!' )


    def _ResetService( self, service_key, delete_updates = False ):

        self._c.execute( 'COMMIT;' )

        if not self._fast_big_transaction_wal:

            self._c.execute( 'PRAGMA journal_mode = TRUNCATE;' )


        self._c.execute( 'PRAGMA foreign_keys = ON;' )

        self._c.execute( 'BEGIN IMMEDIATE;' )

        service_id = self._GetServiceId( service_key )

        service = self._GetService( service_id )

        ( service_key, service_type, name, info ) = service.ToTuple()

        prefix = 'resetting ' + name

        job_key = ClientThreading.JobKey()

        job_key.SetVariable( 'popup_text_1', prefix + ': deleting service' )

        self._controller.pub( 'message', job_key )

        self._DeleteService( service_id, delete_update_dir = delete_updates )

        if service_type in HC.REPOSITORIES:

            job_key.SetVariable( 'popup_text_1', prefix + ': deleting downloaded updates' )

            if delete_updates:

                info[ 'first_timestamp' ] = None
                info[ 'next_download_timestamp' ] = 0


            info[ 'next_processing_timestamp' ] = 0

            self.pub_after_commit( 'notify_restart_repo_sync_daemon' )


        job_key.SetVariable( 'popup_text_1', prefix + ': recreating service' )

        self._AddService( service_key, service_type, name, info )

        self.pub_after_commit( 'notify_new_pending' )
        self.pub_after_commit( 'notify_new_services_data' )
        self.pub_after_commit( 'notify_new_services_gui' )

        job_key.SetVariable( 'popup_text_1', prefix + ': done!' )

        self._c.execute( 'COMMIT;' )

        self._InitDBCursor()

        self._c.execute( 'BEGIN IMMEDIATE;' )

        job_key.Finish()


    def _SaveOptions( self, options ):

        ( old_options, ) = self._c.execute( 'SELECT options FROM options;' ).fetchone()

        ( old_width, old_height ) = old_options[ 'thumbnail_dimensions' ]

        ( new_width, new_height ) = options[ 'thumbnail_dimensions' ]

        self._c.execute( 'UPDATE options SET options = ?;', ( options, ) )

        resize_thumbs = new_width != old_width or new_height != old_height

        if resize_thumbs:

            self.pub_after_commit( 'thumbnail_resize' )


        self.pub_after_commit( 'notify_new_options' )


    def _SetJSONDump( self, obj ):

        if isinstance( obj, HydrusSerialisable.SerialisableBaseNamed ):

            ( dump_type, dump_name, version, serialisable_info ) = obj.GetSerialisableTuple()

            try:

                dump = json.dumps( serialisable_info )

            except Exception as e:

                HydrusData.ShowException( e )
                HydrusData.Print( obj )
                HydrusData.Print( serialisable_info )

                raise Exception( 'Trying to json dump the object ' + HydrusData.ToUnicode( obj ) + ' with name ' + dump_name + ' caused an error. Its serialisable info has been dumped to the log.' )


            self._c.execute( 'DELETE FROM json_dumps_named WHERE dump_type = ? AND dump_name = ?;', ( dump_type, dump_name ) )

            self._c.execute( 'INSERT INTO json_dumps_named ( dump_type, dump_name, version, dump ) VALUES ( ?, ?, ?, ? );', ( dump_type, dump_name, version, sqlite3.Binary( dump ) ) )

        else:

            ( dump_type, version, serialisable_info ) = obj.GetSerialisableTuple()

            try:

                dump = json.dumps( serialisable_info )

            except Exception as e:

                HydrusData.ShowException( e )
                HydrusData.Print( obj )
                HydrusData.Print( serialisable_info )

                raise Exception( 'Trying to json dump the object ' + HydrusData.ToUnicode( obj ) + ' caused an error. Its serialisable info has been dumped to the log.' )


            self._c.execute( 'DELETE FROM json_dumps WHERE dump_type = ?;', ( dump_type, ) )

            self._c.execute( 'INSERT INTO json_dumps ( dump_type, version, dump ) VALUES ( ?, ?, ? );', ( dump_type, version, sqlite3.Binary( dump ) ) )


    def _SetJSONSimple( self, name, value ):

        if value is None:

            self._c.execute( 'DELET FROM json_dict WHERE name = ?;', ( name, ) )

        else:

            json_dump = json.dumps( value )

            self._c.execute( 'REPLACE INTO json_dict ( name, dump ) VALUES ( ?, ? );', ( name, sqlite3.Binary( json_dump ) ) )


    def _SetPassword( self, password ):

        if password is not None:

            # to convert from unusual unicode types
            password_bytes = HydrusData.ToByteString( password )

            password = hashlib.sha256( password_bytes ).digest()


        options = self._controller.GetOptions()

        options[ 'password' ] = password

        self._SaveOptions( options )


    def _SetServiceFilename( self, service_id, hash_id, filename ):

        self._c.execute( 'REPLACE INTO service_filenames ( service_id, hash_id, filename ) VALUES ( ?, ?, ? );', ( service_id, hash_id, filename ) )


    def _SetServiceDirectory( self, service_id, hash_ids, dirname, note ):

        directory_id = self._GetTextId( dirname )

        self._c.execute( 'DELETE FROM service_directories WHERE service_id = ? AND directory_id = ?;', ( service_id, directory_id ) )
        self._c.execute( 'DELETE FROM service_directory_file_map WHERE service_id = ? AND directory_id = ?;', ( service_id, directory_id ) )

        num_files = len( hash_ids )

        result = self._c.execute( 'SELECT SUM( size ) FROM files_info WHERE hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';' ).fetchone()

        if result is None:

            total_size = 0

        else:

            ( total_size, ) = result


        self._c.execute( 'INSERT INTO service_directories ( service_id, directory_id, num_files, total_size, note ) VALUES ( ?, ?, ?, ?, ? );', ( service_id, directory_id, num_files, total_size, note ) )
        self._c.executemany( 'INSERT INTO service_directory_file_map ( service_id, directory_id, hash_id ) VALUES ( ?, ?, ? );', ( ( service_id, directory_id, hash_id ) for hash_id in hash_ids ) )


    def _SetTagCensorship( self, info ):

        self._c.execute( 'DELETE FROM tag_censorship;' )

        for ( service_key, blacklist, tags ) in info:

            service_id = self._GetServiceId( service_key )

            self._c.execute( 'INSERT OR IGNORE INTO tag_censorship ( service_id, blacklist, tags ) VALUES ( ?, ?, ? );', ( service_id, blacklist, tags ) )


        self.pub_after_commit( 'notify_new_tag_censorship' )


    def _SetYAMLDump( self, dump_type, dump_name, data ):

        if dump_type == YAML_DUMP_ID_SUBSCRIPTION: self._subscriptions_cache[ dump_name ] = data

        if dump_type == YAML_DUMP_ID_LOCAL_BOORU: dump_name = dump_name.encode( 'hex' )

        self._c.execute( 'DELETE FROM yaml_dumps WHERE dump_type = ? AND dump_name = ?;', ( dump_type, dump_name ) )

        try: self._c.execute( 'INSERT INTO yaml_dumps ( dump_type, dump_name, dump ) VALUES ( ?, ?, ? );', ( dump_type, dump_name, data ) )
        except:

            HydrusData.Print( ( dump_type, dump_name, data ) )

            raise


        if dump_type == YAML_DUMP_ID_LOCAL_BOORU:

            service_id = self._GetServiceId( CC.LOCAL_BOORU_SERVICE_KEY )

            self._c.execute( 'DELETE FROM service_info WHERE service_id = ? AND info_type = ?;', ( service_id, HC.SERVICE_INFO_NUM_SHARES ) )

            self._controller.pub( 'refresh_local_booru_shares' )


    def _SyncHashesToTagArchive( self, hashes, hta_path, tag_service_key, adding, namespaces ):

        hta = HydrusTagArchive.HydrusTagArchive( hta_path )

        hash_type = hta.GetHashType()

        content_updates = []

        for hash in hashes:

            if hash_type == HydrusTagArchive.HASH_TYPE_SHA256: archive_hash = hash
            else:

                hash_id = self._GetHashId( hash )

                if hash_type == HydrusTagArchive.HASH_TYPE_MD5: h = 'md5'
                elif hash_type == HydrusTagArchive.HASH_TYPE_SHA1: h = 'sha1'
                elif hash_type == HydrusTagArchive.HASH_TYPE_SHA512: h = 'sha512'

                try: ( archive_hash, ) = self._c.execute( 'SELECT ' + h + ' FROM local_hashes WHERE hash_id = ?;', ( hash_id, ) ).fetchone()
                except: return


            tags = HydrusTags.CleanTags( hta.GetTags( archive_hash ) )

            desired_tags = HydrusTags.FilterNamespaces( tags, namespaces )

            if len( desired_tags ) > 0:

                if tag_service_key != CC.LOCAL_TAG_SERVICE_KEY and not adding:

                    action = HC.CONTENT_UPDATE_PETITION

                    rows = [ ( tag, ( hash, ), 'admin: tag archive desync' ) for tag in desired_tags ]

                else:

                    if adding:

                        if tag_service_key == CC.LOCAL_TAG_SERVICE_KEY: action = HC.CONTENT_UPDATE_ADD
                        else: action = HC.CONTENT_UPDATE_PEND

                    else: action = HC.CONTENT_UPDATE_DELETE

                    rows = [ ( tag, ( hash, )  ) for tag in desired_tags ]


                content_updates.extend( [ HydrusData.ContentUpdate( HC.CONTENT_TYPE_MAPPINGS, action, row ) for row in rows ] )


        if len( content_updates ) > 0:

            service_keys_to_content_updates = { tag_service_key : content_updates }

            self._ProcessContentUpdates( service_keys_to_content_updates )


    def _TagExists( self, tag ):

        if ':' in tag:

            ( namespace, tag ) = tag.split( ':', 1 )

            result = self._c.execute( 'SELECT namespace_id FROM namespaces WHERE namespace = ?;', ( namespace, ) ).fetchone()

            if result is None:

                return False


        result = self._c.execute( 'SELECT tag_id FROM tags WHERE tag = ?;', ( tag, ) ).fetchone()

        if result is None:

            return False

        else:

            return True


    def _UpdateDB( self, version ):

        self._controller.pub( 'splash_set_title_text', 'updating db to v' + str( version + 1 ) )

        if version == 192:

            no_wal_path = os.path.join( self._db_dir, 'no-wal' )

            if os.path.exists( no_wal_path ):

                os.remove( no_wal_path )


        if version == 193:

            self._c.execute( 'CREATE TABLE service_filenames ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, filename TEXT, PRIMARY KEY( service_id, hash_id ) );' )


        if version == 194:

            service_data = self._c.execute( 'SELECT service_id, info FROM services WHERE service_type IN ( ?, ? );', ( HC.FILE_REPOSITORY, HC.TAG_REPOSITORY ) ).fetchall()

            for ( service_id, info ) in service_data:

                info[ 'next_processing_timestamp' ] = 0

                self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


            #

            service_data = self._c.execute( 'SELECT service_id, info FROM services WHERE service_type = ?;', ( HC.IPFS, ) ).fetchall()

            for ( service_id, info ) in service_data:

                info[ 'multihash_prefix' ] = ''

                self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


        if version == 195:

            self._controller.pub( 'splash_set_status_text', 'clearing out surplus autocomplete entries' )

            combined_tag_service_id = self._GetServiceId( CC.COMBINED_TAG_SERVICE_KEY )

            self._c.execute( 'DELETE FROM autocomplete_tags_cache WHERE tag_service_id = ?;', ( combined_tag_service_id, ) )

            #

            self._controller.pub( 'splash_set_status_text', 'clearing out existing tags orphans' )

            self._c.execute( 'DELETE FROM existing_tags;' )

            self._c.execute( 'INSERT OR IGNORE INTO existing_tags SELECT DISTINCT namespace_id, tag_id FROM mappings;' )
            self._c.execute( 'INSERT OR IGNORE INTO existing_tags SELECT DISTINCT child_namespace_id, child_tag_id FROM tag_parents;' )
            self._c.execute( 'INSERT OR IGNORE INTO existing_tags SELECT DISTINCT parent_namespace_id, parent_tag_id FROM tag_parents;' )
            self._c.execute( 'INSERT OR IGNORE INTO existing_tags SELECT DISTINCT old_namespace_id, old_tag_id FROM tag_siblings;' )
            self._c.execute( 'INSERT OR IGNORE INTO existing_tags SELECT DISTINCT new_namespace_id, new_tag_id FROM tag_siblings;' )

            #

            self._controller.pub( 'splash_set_status_text', 'clearing out orphan autocomplete entries' )

            namespace_ids = [ namespace_id for ( namespace_id, ) in self._c.execute( 'SELECT namespace_id FROM namespaces;' ) ]

            for namespace_id in namespace_ids:

                self._c.execute( 'DELETE FROM autocomplete_tags_cache WHERE namespace_id = ? AND tag_id NOT IN ( SELECT tag_id FROM existing_tags WHERE namespace_id = ? );', ( namespace_id, namespace_id ) )


        if version == 196:

            self._controller.pub( 'splash_set_status_text', 'clearing out more surplus autocomplete entries' )

            combined_file_service_id = self._GetServiceId( CC.COMBINED_FILE_SERVICE_KEY )

            self._c.execute( 'DELETE FROM autocomplete_tags_cache WHERE file_service_id != ?;', ( combined_file_service_id, ) )


        if version == 198:

            all_service_info = self._c.execute( 'SELECT * FROM services;' ).fetchall()

            self._c.execute( 'DROP TABLE services;' )

            self._c.execute( 'CREATE TABLE services ( service_id INTEGER PRIMARY KEY AUTOINCREMENT, service_key BLOB_BYTES, service_type INTEGER, name TEXT, info TEXT_YAML );' )
            self._c.execute( 'CREATE UNIQUE INDEX services_service_key_index ON services ( service_key );' )

            self._c.executemany( 'INSERT INTO services VALUES ( ?, ?, ?, ?, ? );', ( ( service_id, sqlite3.Binary( service_key ), service_type, name, info ) for ( service_id, service_key, service_type, name, info ) in all_service_info ) )

            self._c.execute( 'DROP TABLE autocomplete_tags_cache;' )

            #

            self._controller.pub( 'splash_set_status_text', 'exporting mappings to external db' )

            self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.mappings ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, status INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id, status ) );' )

            self._c.execute( 'INSERT INTO external_mappings.mappings SELECT * FROM main.mappings;' )

            self._c.execute( 'DROP TABLE main.mappings;' )

            self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.mapping_petitions ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, reason_id INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id, reason_id ) );' )

            self._c.execute( 'INSERT INTO external_mappings.mapping_petitions SELECT * FROM main.mapping_petitions;' )

            self._c.execute( 'DROP TABLE main.mapping_petitions;' )


        if version == 199:

            self._c.execute( 'CREATE TABLE json_dict ( name TEXT PRIMARY KEY, dump BLOB_BYTES );' )

            results = self._GetYAMLDump( YAML_DUMP_ID_SINGLE )

            for ( name, value ) in results.items():

                self._SetJSONSimple( name, value )


            self._c.execute( 'DELETE FROM yaml_dumps WHERE dump_type = ?;', ( YAML_DUMP_ID_SINGLE, ) )

            #

            self._controller.pub( 'splash_set_status_text', 'exporting deleted mappings to new table' )

            self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.deleted_mappings ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id ) );' )

            self._c.execute( 'INSERT INTO external_mappings.deleted_mappings SELECT service_id, namespace_id, tag_id, hash_id FROM mappings WHERE status = ?;', ( HC.DELETED, ) )

            self._c.execute( 'DELETE FROM mappings WHERE status = ?;', ( HC.DELETED, ) )

            self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.deleted_mappings_namespace_id_index ON deleted_mappings ( namespace_id );' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.deleted_mappings_tag_id_index ON deleted_mappings ( tag_id );' )
            self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.deleted_mappings_hash_id_index ON deleted_mappings ( hash_id );' )


        if version == 200:

            self._controller.pub( 'splash_set_status_text', 'deleting service mapping orphans' )

            names = { name for ( name, ) in self._c.execute( 'SELECT name FROM external_mappings.sqlite_master WHERE type = ?;', ( 'table', ) ) }

            if 'mappings' in names: # it is possible that at least one user did the update, but the subsequent vacuum failed, so the version didn't increment, so this catches them

                service_ids = self._GetServiceIds( HC.TAG_SERVICES )

                splayed_service_ids = HydrusData.SplayListForDB( service_ids )

                self._c.execute( 'DELETE FROM mappings WHERE service_id NOT IN ' + splayed_service_ids + ';' )
                self._c.execute( 'DELETE FROM deleted_mappings WHERE service_id NOT IN ' + splayed_service_ids + ';' )
                self._c.execute( 'DELETE FROM mapping_petitions WHERE service_id NOT IN ' + splayed_service_ids + ';' )

                #

                self._controller.pub( 'splash_set_status_text', 'exporting hashes to external db' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.hashes ( hash_id INTEGER PRIMARY KEY, hash BLOB_BYTES UNIQUE );' )

                self._c.execute( 'INSERT INTO external_master.hashes SELECT * FROM main.hashes;' )

                self._c.execute( 'DROP TABLE main.hashes;' )

                #

                self._controller.pub( 'splash_set_status_text', 'exporting tags to external db' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.namespaces ( namespace_id INTEGER PRIMARY KEY, namespace TEXT UNIQUE );' )

                self._c.execute( 'INSERT INTO external_master.namespaces SELECT * FROM main.namespaces;' )

                self._c.execute( 'DROP TABLE main.namespaces;' )

                #

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.tags ( tag_id INTEGER PRIMARY KEY, tag TEXT UNIQUE );' )

                self._c.execute( 'INSERT INTO external_master.tags SELECT * FROM main.tags;' )

                self._c.execute( 'DROP TABLE main.tags;' )

                self._c.execute( 'DROP TABLE main.tags_fts4;' )

                self._c.execute( 'CREATE VIRTUAL TABLE IF NOT EXISTS external_master.tags_fts4 USING fts4( tag );' )

                self._c.execute( 'REPLACE INTO tags_fts4 ( docid, tag ) SELECT * FROM tags;' )

                #

                self._controller.pub( 'splash_set_status_text', 'splitting and compacting mappings tables' )

                mapping_petitions_rip = self._c.execute( 'SELECT * FROM mapping_petitions;' ).fetchall()

                self._c.execute( 'DROP TABLE mapping_petitions;' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.mapping_petitions ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, reason_id INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id, reason_id ) ) WITHOUT ROWID;' )

                self._c.executemany( 'INSERT INTO mapping_petitions VALUES ( ?, ?, ?, ?, ? );', mapping_petitions_rip )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.mapping_petitions_hash_id_index ON mapping_petitions ( hash_id );' )

                del mapping_petitions_rip

                #

                deleted_mappings_rip = self._c.execute( 'SELECT * FROM deleted_mappings;' ).fetchall()

                self._c.execute( 'DROP TABLE deleted_mappings;' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.deleted_mappings ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )

                self._c.executemany( 'INSERT INTO deleted_mappings VALUES ( ?, ?, ?, ? );', deleted_mappings_rip )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.deleted_mappings_namespace_id_index ON deleted_mappings ( namespace_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.deleted_mappings_tag_id_index ON deleted_mappings ( tag_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.deleted_mappings_hash_id_index ON deleted_mappings ( hash_id );' )

                del deleted_mappings_rip

                #

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.current_mappings ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'INSERT INTO current_mappings SELECT service_id, namespace_id, tag_id, hash_id FROM mappings WHERE status = ?;', ( HC.CURRENT, ) )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS external_mappings.pending_mappings ( service_id INTEGER, namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( service_id, namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'INSERT INTO pending_mappings SELECT service_id, namespace_id, tag_id, hash_id FROM mappings WHERE status = ?;', ( HC.PENDING, ) )

                self._c.execute( 'DROP TABLE mappings;' )

                self._controller.pub( 'splash_set_status_text', 'creating mappings indices' )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.current_mappings_namespace_id_index ON current_mappings ( namespace_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.current_mappings_tag_id_index ON current_mappings ( tag_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.current_mappings_hash_id_index ON current_mappings ( hash_id );' )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.pending_mappings_namespace_id_index ON pending_mappings ( namespace_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.pending_mappings_tag_id_index ON pending_mappings ( tag_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS external_mappings.pending_mappings_hash_id_index ON pending_mappings ( hash_id );' )

                #

                self._c.execute( 'DELETE FROM service_info;' )

                self._c.execute( 'COMMIT;' )

                self._CloseDBCursor()

                try:

                    for filename in self._db_filenames.values():

                        self._controller.pub( 'splash_set_status_text', 'vacuuming ' + filename )

                        db_path = os.path.join( self._db_dir, filename )

                        try:

                            if HydrusDB.CanVacuum( db_path ):

                                HydrusDB.VacuumDB( db_path )


                        except Exception as e:

                            HydrusData.Print( 'Vacuum failed!' )
                            HydrusData.PrintException( e )


                finally:

                    self._InitDBCursor()

                    self._c.execute( 'BEGIN IMMEDIATE;' )


        if version == 201:

            file_service_ids = self._GetServiceIds( ( HC.LOCAL_FILE_DOMAIN, HC.FILE_REPOSITORY ) )
            tag_service_ids = self._GetServiceIds( ( HC.LOCAL_TAG, HC.TAG_REPOSITORY ) )

            for ( file_service_id, tag_service_id ) in itertools.product( file_service_ids, tag_service_ids ):

                self._controller.pub( 'splash_set_status_text', 'generating specific ac_cache ' + str( file_service_id ) + '_' + str( tag_service_id ) )

                # this is a direct copy of the old code, as v204 ditched current_mappings, breaking the call
                # I've flattened all the other subcalls as well, just in case they soon change

                suffix = str( file_service_id ) + '_' + str( tag_service_id )

                files_table_name = 'external_caches.specific_files_cache_' + suffix

                current_mappings_table_name = 'external_caches.specific_current_mappings_cache_' + suffix

                pending_mappings_table_name = 'external_caches.specific_pending_mappings_cache_' + suffix

                ac_cache_table_name = 'external_caches.specific_ac_cache_' + suffix

                self._c.execute( 'CREATE TABLE ' + files_table_name + ' ( hash_id INTEGER PRIMARY KEY );' )

                self._c.execute( 'CREATE TABLE ' + current_mappings_table_name + ' ( hash_id INTEGER, namespace_id INTEGER, tag_id INTEGER, PRIMARY KEY( hash_id, namespace_id, tag_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'CREATE TABLE ' + pending_mappings_table_name + ' ( hash_id INTEGER, namespace_id INTEGER, tag_id INTEGER, PRIMARY KEY( hash_id, namespace_id, tag_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'CREATE TABLE ' + ac_cache_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, current_count INTEGER, pending_count INTEGER, PRIMARY KEY( namespace_id, tag_id ) ) WITHOUT ROWID;' )

                #

                hash_ids = [ hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM current_files WHERE service_id = ?;', ( file_service_id, ) ) ]

                if len( hash_ids ) > 0:

                    self._c.executemany( 'INSERT OR IGNORE INTO ' + files_table_name + ' VALUES ( ? );', ( ( hash_id, ) for hash_id in hash_ids ) )

                    ac_cache_changes = []

                    for group_of_hash_ids in HydrusData.SplitListIntoChunks( hash_ids, 100 ):

                        splayed_group_of_hash_ids = HydrusData.SplayListForDB( group_of_hash_ids )

                        current_mapping_ids_raw = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM current_mappings WHERE service_id = ? AND hash_id IN ' + splayed_group_of_hash_ids + ';', ( tag_service_id, ) ).fetchall()

                        current_mapping_ids_dict = HydrusData.BuildKeyToSetDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in current_mapping_ids_raw ] )

                        pending_mapping_ids_raw = self._c.execute( 'SELECT namespace_id, tag_id, hash_id FROM pending_mappings WHERE service_id = ? AND hash_id IN ' + splayed_group_of_hash_ids + ';', ( tag_service_id, ) ).fetchall()

                        pending_mapping_ids_dict = HydrusData.BuildKeyToSetDict( [ ( ( namespace_id, tag_id ), hash_id ) for ( namespace_id, tag_id, hash_id ) in pending_mapping_ids_raw ] )

                        all_ids_seen = set( current_mapping_ids_dict.keys() )
                        all_ids_seen.update( pending_mapping_ids_dict.keys() )

                        for ( namespace_id, tag_id ) in all_ids_seen:

                            current_hash_ids = current_mapping_ids_dict[ ( namespace_id, tag_id ) ]

                            num_current = len( current_hash_ids )

                            if num_current > 0:

                                self._c.executemany( 'INSERT OR IGNORE INTO ' + current_mappings_table_name + ' ( hash_id, namespace_id, tag_id ) VALUES ( ?, ?, ? );', ( ( hash_id, namespace_id, tag_id ) for hash_id in current_hash_ids ) )


                            pending_hash_ids = pending_mapping_ids_dict[ ( namespace_id, tag_id ) ]

                            num_pending = len( pending_hash_ids )

                            if num_pending > 0:

                                self._c.executemany( 'INSERT OR IGNORE INTO ' + pending_mappings_table_name + ' ( hash_id, namespace_id, tag_id ) VALUES ( ?, ?, ? );', ( ( hash_id, namespace_id, tag_id ) for hash_id in pending_hash_ids ) )


                            if num_current > 0 or num_pending > 0:

                                ac_cache_changes.append( ( namespace_id, tag_id, num_current, num_pending ) )


                    if len( ac_cache_changes ) > 0:

                        self._c.executemany( 'INSERT OR IGNORE INTO ' + ac_cache_table_name + ' ( namespace_id, tag_id, current_count, pending_count ) VALUES ( ?, ?, ?, ? );', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, num_current, num_pending ) in ac_cache_changes ) )

                        self._c.executemany( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count + ?, pending_count = pending_count + ? WHERE namespace_id = ? AND tag_id = ?;', ( ( num_current, num_pending, namespace_id, tag_id ) for ( namespace_id, tag_id, num_current, num_pending ) in ac_cache_changes ) )


            for tag_service_id in tag_service_ids:

                self._controller.pub( 'splash_set_status_text', 'generating combined files ac_cache ' + str( tag_service_id ) )

                # this is a direct copy of the old code, as v204 ditched current_mappings, breaking the call
                # I've flattened all the other subcalls as well, just in case they soon change

                ac_cache_table_name = 'external_caches.combined_files_ac_cache_' + str( tag_service_id )

                self._c.execute( 'CREATE TABLE ' + ac_cache_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, current_count INTEGER, pending_count INTEGER, PRIMARY KEY( namespace_id, tag_id ) ) WITHOUT ROWID;' )

                #

                current_mappings_exist = self._c.execute( 'SELECT 1 FROM current_mappings WHERE service_id = ? LIMIT 1;', ( tag_service_id, ) ).fetchone() is not None
                pending_mappings_exist = self._c.execute( 'SELECT 1 FROM pending_mappings WHERE service_id = ? LIMIT 1;', ( tag_service_id, ) ).fetchone() is not None

                if current_mappings_exist or pending_mappings_exist:

                    all_known_ids = self._c.execute( 'SELECT namespace_id, tag_id FROM existing_tags;' ).fetchall()

                    for group_of_ids in HydrusData.SplitListIntoChunks( all_known_ids, 10000 ):

                        current_counter = collections.Counter()

                        if current_mappings_exist:

                            for ( namespace_id, tag_id ) in group_of_ids:

                                result = self._c.execute( 'SELECT COUNT( * ) FROM current_mappings WHERE service_id = ? AND namespace_id = ? AND tag_id = ?;', ( tag_service_id, namespace_id, tag_id ) ).fetchone()

                                if result is not None:

                                    ( count, ) = result

                                    if count > 0:

                                        current_counter[ ( namespace_id, tag_id ) ] = count


                        #

                        pending_counter = collections.Counter()

                        if pending_mappings_exist:

                            for ( namespace_id, tag_id ) in group_of_ids:

                                result = self._c.execute( 'SELECT COUNT( * ) FROM pending_mappings WHERE service_id = ? AND namespace_id = ? AND tag_id = ?;', ( tag_service_id, namespace_id, tag_id ) ).fetchone()

                                if result is not None:

                                    ( count, ) = result

                                    if count > 0:

                                        pending_counter[ ( namespace_id, tag_id ) ] = count


                        all_ids_seen = set( current_counter.keys() )
                        all_ids_seen.update( pending_counter.keys() )

                        count_ids = [ ( namespace_id, tag_id, current_counter[ ( namespace_id, tag_id ) ], pending_counter[ ( namespace_id, tag_id ) ] ) for ( namespace_id, tag_id ) in all_ids_seen ]

                        if len( count_ids ) > 0:

                            self._c.executemany( 'INSERT OR IGNORE INTO ' + ac_cache_table_name + ' ( namespace_id, tag_id, current_count, pending_count ) VALUES ( ?, ?, ?, ? );', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, current_delta, pending_delta ) in count_ids ) )

                            self._c.executemany( 'UPDATE ' + ac_cache_table_name + ' SET current_count = current_count + ?, pending_count = pending_count + ? WHERE namespace_id = ? AND tag_id = ?;', ( ( current_delta, pending_delta, namespace_id, tag_id ) for ( namespace_id, tag_id, current_delta, pending_delta ) in count_ids ) )

                            self._c.executemany( 'DELETE FROM ' + ac_cache_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND current_count = ? AND pending_count = ?;', ( ( namespace_id, tag_id, 0, 0 ) for ( namespace_id, tag_id, current_delta, pending_delta ) in count_ids ) )


            cache_dir = os.path.join( self._db_dir, 'client_cache' )

            if os.path.exists( cache_dir ):

                try:

                    HydrusPaths.DeletePath( cache_dir )

                except Exception as e:

                    HydrusData.Print( 'Tried to delete the superfluous cache dir, but got an error:' )

                    HydrusData.PrintException( e )


        if version == 202:

            self._c.execute( 'DELETE FROM analyze_timestamps;' )


        if version == 203:

            service_ids = self._GetServiceIds( HC.TAG_SERVICES )

            for service_id in service_ids:

                self._controller.pub( 'splash_set_status_text', 'creating new mappings tables: ' + str( service_id ) )

                ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( service_id )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + current_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + deleted_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + pending_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id ) ) WITHOUT ROWID;' )

                self._c.execute( 'CREATE TABLE IF NOT EXISTS ' + petitioned_mappings_table_name + ' ( namespace_id INTEGER, tag_id INTEGER, hash_id INTEGER, reason_id INTEGER, PRIMARY KEY( namespace_id, tag_id, hash_id, reason_id ) ) WITHOUT ROWID;' )

                #

                self._c.execute( 'INSERT OR IGNORE INTO ' + current_mappings_table_name + ' SELECT namespace_id, tag_id, hash_id FROM current_mappings WHERE service_id = ?;', ( service_id, ) )
                self._c.execute( 'INSERT OR IGNORE INTO ' + deleted_mappings_table_name + ' SELECT namespace_id, tag_id, hash_id FROM deleted_mappings WHERE service_id = ?;', ( service_id, ) )
                self._c.execute( 'INSERT OR IGNORE INTO ' + pending_mappings_table_name + ' SELECT namespace_id, tag_id, hash_id FROM pending_mappings WHERE service_id = ?;', ( service_id, ) )
                self._c.execute( 'INSERT OR IGNORE INTO ' + petitioned_mappings_table_name + ' SELECT namespace_id, tag_id, hash_id, reason_id FROM mapping_petitions WHERE service_id = ?;', ( service_id, ) )

                #

                self._controller.pub( 'splash_set_status_text', 'creating new mappings indices: ' + str( service_id ) )

                current_mappings_table_simple_name = current_mappings_table_name.split( '.' )[1]
                deleted_mappings_table_simple_name = deleted_mappings_table_name.split( '.' )[1]
                pending_mappings_table_simple_name = pending_mappings_table_name.split( '.' )[1]
                petitioned_mappings_table_simple_name = petitioned_mappings_table_name.split( '.' )[1]

                self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + current_mappings_table_name + '_tag_id_index ON ' + current_mappings_table_simple_name + ' ( tag_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + current_mappings_table_name + '_hash_id_index ON ' + current_mappings_table_simple_name + ' ( hash_id );' )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + deleted_mappings_table_name + '_hash_id_index ON ' + deleted_mappings_table_simple_name + ' ( hash_id );' )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + pending_mappings_table_name + '_tag_id_index ON ' + pending_mappings_table_simple_name + ' ( tag_id );' )
                self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + pending_mappings_table_name + '_hash_id_index ON ' + pending_mappings_table_simple_name + ' ( hash_id );' )

                self._c.execute( 'CREATE INDEX IF NOT EXISTS ' + petitioned_mappings_table_name + '_hash_id_index ON ' + petitioned_mappings_table_simple_name + ' ( hash_id );' )


            self._c.execute( 'DROP TABLE current_mappings;' )
            self._c.execute( 'DROP TABLE pending_mappings;' )
            self._c.execute( 'DROP TABLE deleted_mappings;' )
            self._c.execute( 'DROP TABLE mapping_petitions;' )

            self._controller.pub( 'splash_set_status_text', 'analyzing new tables' )

            self._AnalyzeStaleBigTables()

            self._c.execute( 'COMMIT;' )

            self._CloseDBCursor()

            try:

                for filename in self._db_filenames.values():

                    self._controller.pub( 'splash_set_status_text', 'vacuuming ' + filename )

                    db_path = os.path.join( self._db_dir, filename )

                    try:

                        if HydrusDB.CanVacuum( db_path ):

                            HydrusDB.VacuumDB( db_path )


                    except Exception as e:

                        HydrusData.Print( 'Vacuum failed!' )
                        HydrusData.PrintException( e )


            finally:

                self._InitDBCursor()

                self._c.execute( 'BEGIN IMMEDIATE;' )


        if version == 204:

            self._c.execute( 'DROP TABLE shutdown_timestamps;' )

            self._c.execute( 'CREATE TABLE vacuum_timestamps ( name TEXT, timestamp INTEGER );' )


        if version == 205:

            self._c.execute( 'CREATE TABLE service_directories ( service_id INTEGER REFERENCES services ON DELETE CASCADE, directory_id INTEGER, num_files INTEGER, total_size INTEGER, PRIMARY KEY( service_id, directory_id ) );' )
            self._c.execute( 'CREATE TABLE service_directory_file_map ( service_id INTEGER REFERENCES services ON DELETE CASCADE, directory_id INTEGER, hash_id INTEGER, PRIMARY KEY( service_id, directory_id, hash_id ) );' )

            #

            self._c.execute( 'CREATE TABLE IF NOT EXISTS external_master.texts ( text_id INTEGER PRIMARY KEY, text TEXT UNIQUE );' )

            #

            self._c.execute( 'INSERT OR IGNORE INTO texts SELECT reason_id, reason FROM reasons;' )

            self._c.execute( 'DROP TABLE reasons;' )


        if version == 206:

            self._c.execute( 'DELETE FROM json_dumps_named WHERE dump_type = ? AND dump_name = ?;', ( HydrusSerialisable.SERIALISABLE_TYPE_SHORTCUTS, 'default' ) )


        if version == 207:

            info = self._c.execute( 'SELECT * FROM service_directories;' ).fetchall()

            self._c.execute( 'DROP TABLE service_directories;' )

            #

            self._c.execute( 'CREATE TABLE service_directories ( service_id INTEGER REFERENCES services ON DELETE CASCADE, directory_id INTEGER, num_files INTEGER, total_size INTEGER, note TEXT, PRIMARY KEY( service_id, directory_id ) );' )

            self._c.executemany( 'INSERT INTO service_directories ( service_id, directory_id, num_files, total_size, note ) VALUES ( ?, ?, ?, ?, ? );', ( ( service_id, directory_id, num_files, total_size, '' ) for ( service_id, directory_id, num_files, total_size ) in info ) )


        if version == 208:

            result = self._c.execute( 'SELECT prefix, location FROM client_files_locations;' ).fetchall()

            result.sort()

            old_thumbnail_dir = os.path.join( self._db_dir, 'client_thumbnails' )

            for ( i, ( prefix, location ) ) in enumerate( result ):

                self._controller.pub( 'splash_set_status_text', 'moving thumbnails: ' + HydrusData.ConvertValueRangeToPrettyString( i + 1, 256 ) )

                source_dir = os.path.join( old_thumbnail_dir, prefix )
                dest_dir = os.path.join( location, prefix )

                source_filenames = os.listdir( source_dir )

                for source_filename in source_filenames:

                    source_path = os.path.join( source_dir, source_filename )

                    if source_filename.endswith( '_resized' ):

                        encoded_hash = source_filename[:64]

                        dest_filename = encoded_hash + '.thumbnail.resized'

                    else:

                        encoded_hash = source_filename

                        dest_filename = encoded_hash + '.thumbnail'


                    dest_path = os.path.join( dest_dir, dest_filename )

                    try:

                        HydrusPaths.MergeFile( source_path, dest_path )

                    except:

                        HydrusData.Print( 'Problem moving thumbnail from ' + source_path + ' to ' + dest_path + '.' )
                        HydrusData.Print( 'Abandoning thumbnail transfer for ' + source_dir + '.' )

                        break


            try:

                HydrusPaths.DeletePath( old_thumbnail_dir )

            except:

                HydrusData.Print( 'Could not delete old thumbnail directory at ' + old_thumbnail_dir )


        if version == 209:

            update_dirnames = os.listdir( self._updates_dir )

            for update_dirname in update_dirnames:

                update_dir = os.path.join( self._updates_dir, update_dirname )

                if os.path.isdir( update_dir ):

                    update_filenames = os.listdir( update_dir )

                    for update_filename in update_filenames:

                        update_path = os.path.join( update_dir, update_filename )

                        try:

                            with open( update_path, 'rb' ) as f:

                                content = f.read()


                            obj = HydrusSerialisable.CreateFromString( content )

                            compressed_content = obj.DumpToNetworkString()

                            with open( update_path, 'wb' ) as f:

                                f.write( compressed_content )


                        except:

                            HydrusData.Print( 'The path ' + update_path + ' failed to convert to a network string.' )


        if version == 211:

            self._c.execute( 'REPLACE INTO yaml_dumps VALUES ( ?, ?, ? );', ( YAML_DUMP_ID_REMOTE_BOORU, 'rule34@booru.org', ClientDefaults.GetDefaultBoorus()[ 'rule34@booru.org' ] ) )

            #

            try:

                service_data = self._c.execute( 'SELECT service_id, info FROM services;' ).fetchall()

                client_archives_folder = os.path.join( self._db_dir, 'client_archives' )

                for ( service_id, info ) in service_data:

                    if 'tag_archive_sync' in info:

                        tas_flat = info[ 'tag_archive_sync' ].items()

                        info[ 'tag_archive_sync' ] = { HydrusPaths.ConvertAbsPathToPortablePath( os.path.join( client_archives_folder, archive_name + '.db', HC.BASE_DIR ) ) : namespaces for ( archive_name, namespaces ) in tas_flat }

                        self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


            except Exception as e:

                HydrusData.Print( 'Trying to update tag archive location caused the following problem:' )

                HydrusData.PrintException( e )


        if version == 212:

            prefixes_to_locations = dict( self._c.execute( 'SELECT prefix, location FROM client_files_locations;' ).fetchall() )

            ( total_to_do, ) = self._c.execute( 'SELECT COUNT( * ) FROM files_info WHERE mime IN ( ?, ? );', ( HC.IMAGE_PNG, HC.IMAGE_GIF ) ).fetchone()

            for ( i, ( hash, mime ) ) in enumerate( self._c.execute( 'SELECT hash, mime FROM files_info, hashes USING ( hash_id ) WHERE mime IN ( ?, ? );', ( HC.IMAGE_PNG, HC.IMAGE_GIF ) ) ):

                if ( i + 1 ) % 50 == 0:

                    self._controller.pub( 'splash_set_status_text', 'regenerating thumbnails: ' + HydrusData.ConvertValueRangeToPrettyString( i + 1, total_to_do ) )


                hash_hex = hash.encode( 'hex' )

                prefix = hash_hex[:2]

                ext = HC.mime_ext_lookup[ mime ]

                path_base = os.path.join( prefixes_to_locations[ prefix ], prefix, hash_hex )

                file_path = path_base + ext

                if os.path.exists( file_path ):

                    try:

                        thumbnail_path = path_base + '.thumbnail'
                        resized_thumbnail_path = path_base + '.thumbnail.resized'

                        if os.path.exists( thumbnail_path ):

                            os.remove( thumbnail_path )


                        if os.path.exists( resized_thumbnail_path ):

                            os.remove( resized_thumbnail_path )


                        thumbnail = HydrusFileHandling.GenerateThumbnail( file_path )

                        with open( thumbnail_path, 'wb' ) as f:

                            f.write( thumbnail )


                    except Exception as e:

                        HydrusData.Print( 'Failed to regen thumbnail for ' + file_path + '! Error was:' )
                        HydrusData.PrintException( e )


            #

            # manage services was accidentally sometimes allowing people to create noneditable services

            self._service_cache = {}

            local_booru_service_id = self._GetServiceId( CC.LOCAL_BOORU_SERVICE_KEY )
            local_tag_service_id = self._GetServiceId( CC.LOCAL_TAG_SERVICE_KEY )

            local_service_ids = self._GetServiceIds( ( HC.LOCAL_BOORU, HC.LOCAL_TAG ) )

            bad_local_service_ids = [ local_service_id for local_service_id in local_service_ids if local_service_id not in ( local_booru_service_id, local_tag_service_id ) ]

            for bad_local_service_id in bad_local_service_ids:

                try:

                    self._DeleteService( bad_local_service_id )

                except Exception as e:

                    HydrusData.Print( 'Failed to delete service ' + str( bad_local_service_id ) + '! Error was:' )
                    HydrusData.PrintException( e )


        if version == 214:

            # missed foreign key, so clean out any orphan entries here

            service_ids = { service_id for ( service_id, ) in self._c.execute( 'SELECT service_id FROM services;' ) }

            info = [ ( service_id, hash_id, reason_id ) for ( service_id, hash_id, reason_id ) in self._c.execute( 'SELECT * FROM file_petitions;' ) if service_id in service_ids ]

            self._c.execute( 'DROP TABLE file_petitions;' )

            self._c.execute( 'CREATE TABLE file_petitions ( service_id INTEGER REFERENCES services ON DELETE CASCADE, hash_id INTEGER, reason_id INTEGER, PRIMARY KEY( service_id, hash_id, reason_id ) );' )
            self._c.execute( 'CREATE INDEX file_petitions_hash_id_index ON file_petitions ( hash_id );' )

            self._c.executemany( 'INSERT INTO file_petitions ( service_id, hash_id, reason_id ) VALUES ( ?, ?, ? );', info )

            #

            self._c.execute( 'REPLACE INTO yaml_dumps VALUES ( ?, ?, ? );', ( YAML_DUMP_ID_REMOTE_BOORU, 'sankaku chan', ClientDefaults.GetDefaultBoorus()[ 'sankaku chan' ] ) )


        if version == 215:

            info = self._c.execute( 'SELECT prefix, location FROM client_files_locations;' ).fetchall()

            self._c.execute( 'DELETE FROM client_files_locations;' )

            for ( i, ( prefix, location ) ) in enumerate( info ):

                self._c.execute( 'INSERT INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', ( 'f' + prefix, location ) )
                self._c.execute( 'INSERT INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', ( 't' + prefix, location ) )
                self._c.execute( 'INSERT INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', ( 'r' + prefix, location ) )

                location = HydrusPaths.ConvertPortablePathToAbsPath( location, HC.BASE_DIR )

                text_prefix = 'rearranging client files: ' + HydrusData.ConvertValueRangeToPrettyString( i + 1, 256 ) + ', '

                source = os.path.join( location, prefix )
                file_dest = os.path.join( location, 'f' + prefix )
                thumb_dest = os.path.join( location, 't' + prefix )
                resized_dest = os.path.join( location, 'r' + prefix )

                if os.path.exists( source ): # recover from this update being previously interrupted

                    HydrusPaths.MergeTree( source, file_dest )

                    HydrusPaths.MakeSureDirectoryExists( thumb_dest )
                    HydrusPaths.MakeSureDirectoryExists( resized_dest )

                    filenames = os.listdir( file_dest )

                    num_to_do = len( filenames )

                    for ( j, filename ) in enumerate( filenames ):

                        if j % 100 == 0:

                            self._controller.pub( 'splash_set_status_text', text_prefix + HydrusData.ConvertValueRangeToPrettyString( j, num_to_do ) )


                        source_path = os.path.join( file_dest, filename )

                        if source_path.endswith( 'thumbnail' ):

                            dest_path = os.path.join( thumb_dest, filename )

                            HydrusPaths.MergeFile( source_path, dest_path )

                        elif source_path.endswith( 'resized' ):

                            dest_path = os.path.join( resized_dest, filename )

                            HydrusPaths.MergeFile( source_path, dest_path )


        if version == 220:

            self._c.execute( 'CREATE TABLE recent_tags ( service_id INTEGER REFERENCES services ON DELETE CASCADE, namespace_id INTEGER, tag_id INTEGER, timestamp INTEGER, PRIMARY KEY ( service_id, namespace_id, tag_id ) );' )


        if version == 228:

            # now db_dir is moveable, updating portable path base from base_dir to db_dir

            def update_portable_path( p ):

                if p is None:

                    return p


                p = os.path.normpath( p ) # collapses .. stuff and converts / to \\ for windows only

                if os.path.isabs( p ):

                    a_p = p

                else:

                    a_p = os.path.normpath( os.path.join( HC.BASE_DIR, p ) )


                if not HC.PLATFORM_WINDOWS and not os.path.exists( a_p ):

                    a_p = a_p.replace( '\\', '/' )


                try:

                    p = os.path.relpath( a_p, self._db_dir )

                    if p.startswith( '..' ):

                        p = a_p


                except:

                    p = a_p


                if HC.PLATFORM_WINDOWS:

                    p = p.replace( '\\', '/' ) # store seps as /, to maintain multiplatform uniformity


                return p


            #

            try:

                service_data = self._c.execute( 'SELECT service_id, info FROM services;' ).fetchall()

                for ( service_id, info ) in service_data:

                    if 'tag_archive_sync' in info:

                        improved_tas = {}

                        for ( old_portable_path, namespaces ) in info[ 'tag_archive_sync' ].items():

                            new_portable_path = update_portable_path( old_portable_path )

                            improved_tas[ new_portable_path ] = namespaces


                        info[ 'tag_archive_sync' ] = improved_tas

                        self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


            except Exception as e:

                HydrusData.Print( 'Trying to update tag archive portable location caused the following problem:' )

                HydrusData.PrintException( e )


            #

            try:

                client_files_locations = self._c.execute( 'SELECT prefix, location FROM client_files_locations;' ).fetchall()

                improved_cfs = []

                for ( prefix, old_portable_location ) in client_files_locations:

                    new_portable_location = update_portable_path( old_portable_location )

                    improved_cfs.append( ( prefix, new_portable_location ) )


                self._c.executemany( 'REPLACE INTO client_files_locations ( prefix, location ) VALUES ( ?, ? );', improved_cfs )

            except Exception as e:

                HydrusData.Print( 'Trying to update client files portable locations caused the following problem:' )

                HydrusData.PrintException( e )


            #

            try:

                options = self._GetOptions()

                options[ 'export_path' ] = update_portable_path( options[ 'export_path' ] )

                self._c.execute( 'UPDATE options SET options = ?;', ( options, ) )

            except Exception as e:

                HydrusData.Print( 'Trying to update export path portable location caused the following problem:' )

                HydrusData.PrintException( e )


        if version == 229:

            self._c.executemany( 'INSERT OR IGNORE INTO json_dumps_named VALUES ( ?, ?, ?, ? );', [ ( 32, 'gelbooru md5', 1, '''["http://gelbooru.com/index.php", 0, 1, 1, "md5", {"s": "list", "page": "post"}, [[30, 1, ["we got sent back to main gallery page -- title test", 8, [27, 1, [[["head", {}, 0], ["title", {}, 0]], null]], [true, true, "Image List"]]], [30, 1, ["", 0, [27, 1, [[["li", {"class": "tag-type-general"}, null], ["a", {}, 1]], null]], ""]], [30, 1, ["", 0, [27, 1, [[["li", {"class": "tag-type-copyright"}, null], ["a", {}, 1]], null]], "series"]], [30, 1, ["", 0, [27, 1, [[["li", {"class": "tag-type-artist"}, null], ["a", {}, 1]], null]], "creator"]], [30, 1, ["", 0, [27, 1, [[["li", {"class": "tag-type-character"}, null], ["a", {}, 1]], null]], "character"]], [30, 1, ["we got sent back to main gallery page -- page links exist", 8, [27, 1, [[["div", {}, null]], "class"]], [true, true, "pagination"]]]]]''' ) ] )


        if version == 230:

            self._c.executemany( 'INSERT OR IGNORE INTO json_dumps_named VALUES ( ?, ?, ?, ? );', [ ( 32, 'iqdb danbooru', 1, '''["http://danbooru.iqdb.org/", 1, 0, 0, "file", {}, [[29, 1, ["link to danbooru", [27, 1, [[["td", {"class": "image"}, 1], ["a", {}, 0]], "href"]], [[30, 1, ["", 0, [27, 1, [[["section", {"id": "tag-list"}, 0], ["li", {"class": "category-1"}, null], ["a", {"class": "search-tag"}, 0]], null]], "creator"]], [30, 1, ["", 0, [27, 1, [[["section", {"id": "tag-list"}, 0], ["li", {"class": "category-3"}, null], ["a", {"class": "search-tag"}, 0]], null]], "series"]], [30, 1, ["", 0, [27, 1, [[["section", {"id": "tag-list"}, 0], ["li", {"class": "category-4"}, null], ["a", {"class": "search-tag"}, 0]], null]], "character"]], [30, 1, ["", 0, [27, 1, [[["section", {"id": "tag-list"}, 0], ["li", {"class": "category-0"}, null], ["a", {"class": "search-tag"}, 0]], null]], ""]]]]], [30, 1, ["no iqdb match found", 8, [27, 1, [[["th", {}, null]], null]], [false, true, "Best match"]]]]]''' ) ] )


        if version == 233:

            self._controller.pub( 'splash_set_status_text', 'moving phashes from main to cache' )

            self._c.execute( 'CREATE TABLE external_caches.shape_perceptual_hashes ( phash_id INTEGER PRIMARY KEY, phash BLOB_BYTES UNIQUE );' )

            self._c.execute( 'CREATE TABLE external_caches.shape_perceptual_hash_map ( phash_id INTEGER, hash_id INTEGER, PRIMARY KEY ( phash_id, hash_id ) );' )
            self._c.execute( 'CREATE INDEX external_caches.shape_perceptual_hash_map_hash_id_index ON shape_perceptual_hash_map ( hash_id );' )

            try:

                def GetPHashId( phash ):

                    result = self._c.execute( 'SELECT phash_id FROM shape_perceptual_hashes WHERE phash = ?;', ( sqlite3.Binary( phash ), ) ).fetchone()

                    if result is None:

                        self._c.execute( 'INSERT INTO shape_perceptual_hashes ( phash ) VALUES ( ? );', ( sqlite3.Binary( phash ), ) )

                        phash_id = self._c.lastrowid

                    else:

                        ( phash_id, ) = result


                    return phash_id


                current_phash_info = self._c.execute( 'SELECT hash_id, phash FROM main.perceptual_hashes;' ).fetchall()

                num_to_do = len( current_phash_info )

                for ( i, ( hash_id, phash ) ) in enumerate( current_phash_info ):

                    if i % 500 == 0:

                        self._controller.pub( 'splash_set_status_text', 'moving phashes: ' + HydrusData.ConvertValueRangeToPrettyString( i, num_to_do ) )


                    phash_id = GetPHashId( phash )

                    self._c.execute( 'INSERT OR IGNORE INTO shape_perceptual_hash_map ( phash_id, hash_id ) VALUES ( ?, ? );', ( phash_id, hash_id ) )


            except Exception as e:

                HydrusData.PrintException( e )

                self._controller.pub( 'splash_set_status_text', 'moving phashes failed, error written to log' )

                time.sleep( 3 )


            self._c.execute( 'DROP TABLE main.perceptual_hashes;' )

            #

            self._controller.pub( 'splash_set_status_text', 'removing redundant trash deletion record' )

            try:

                trash_service_id = self._GetServiceId( CC.TRASH_SERVICE_KEY )

                self._c.execute( 'DELETE FROM deleted_files WHERE service_id = ?;', ( trash_service_id, ) )

                self._c.execute( 'DELETE FROM service_info WHERE service_id = ? AND info_type = ?;', ( trash_service_id, HC.SERVICE_INFO_NUM_DELETED_FILES ) )

            except Exception as e:

                HydrusData.PrintException( e )

                self._controller.pub( 'splash_set_status_text', 'removing trash deletion record failed, error written to log' )


        if version == 234:

            self._c.execute( 'CREATE TABLE external_caches.shape_vptree ( phash_id INTEGER PRIMARY KEY, parent_id INTEGER, radius INTEGER, inner_id INTEGER, inner_population INTEGER, outer_id INTEGER, outer_population INTEGER );' )
            self._c.execute( 'CREATE INDEX external_caches.shape_vptree_parent_id_index ON shape_vptree ( parent_id );' )

            self._c.execute( 'CREATE TABLE external_caches.shape_maintenance_phash_regen ( hash_id INTEGER PRIMARY KEY );' )
            self._c.execute( 'CREATE TABLE external_caches.shape_maintenance_branch_regen ( phash_id INTEGER PRIMARY KEY );' )

            # now to populate it!

            prefix = 'generating faster duplicate search data - '
            self._controller.pub( 'splash_set_status_text', prefix + 'gathering leaves' )

            all_nodes = self._c.execute( 'SELECT phash_id, phash FROM shape_perceptual_hashes;' ).fetchall()

            if len( all_nodes ) > 0:

                ( root_id, root_phash ) = HydrusData.RandomPop( all_nodes )

                process_queue = [ ( None, root_id, root_phash, all_nodes ) ]

                insert_rows = []

                num_done = 0
                num_to_do = len( all_nodes ) + 1

                while len( process_queue ) > 0:

                    if num_done % 500 == 0:

                        self._controller.pub( 'splash_set_status_text', prefix + HydrusData.ConvertValueRangeToPrettyString( num_done, num_to_do ) )


                    ( parent_id, phash_id, phash, children ) = process_queue.pop( 0 )

                    if len( children ) == 0:

                        inner_id = None
                        inner_population = 0

                        outer_id = None
                        outer_population = 0

                        radius = None

                    else:

                        children = [ ( HydrusData.GetHammingDistance( phash, child_phash ), child_id, child_phash ) for ( child_id, child_phash ) in children ]

                        children.sort()

                        median_index = len( children ) / 2

                        radius = children[ median_index ][0]

                        inner_children = [ ( child_id, child_phash ) for ( distance, child_id, child_phash ) in children if distance <= radius ]
                        outer_children = [ ( child_id, child_phash ) for ( distance, child_id, child_phash ) in children if distance > radius ]

                        inner_population =  len( inner_children )
                        outer_population =  len( outer_children )

                        ( inner_id, inner_phash ) = HydrusData.MedianPop( inner_children )

                        if len( outer_children ) == 0:

                            outer_id = None

                        else:

                            ( outer_id, outer_phash ) = HydrusData.MedianPop( outer_children )


                    insert_rows.append( ( phash_id, parent_id, radius, inner_id, inner_population, outer_id, outer_population ) )

                    if inner_id is not None:

                        process_queue.append( ( phash_id, inner_id, inner_phash, inner_children ) )


                    if outer_id is not None:

                        process_queue.append( ( phash_id, outer_id, outer_phash, outer_children ) )


                    num_done += 1


                self._controller.pub( 'splash_set_status_text', prefix + 'committing' )

                self._c.executemany( 'INSERT INTO shape_vptree ( phash_id, parent_id, radius, inner_id, inner_population, outer_id, outer_population ) VALUES ( ?, ?, ?, ?, ?, ?, ? );', insert_rows )


        if version == 236:

            self._controller.pub( 'splash_set_status_text', 'updating local files services' )

            # update existing services

            self._c.execute( 'UPDATE services SET name = ? WHERE service_key = ?;', ( 'my files', sqlite3.Binary( CC.LOCAL_FILE_SERVICE_KEY ) ) )

            self._c.execute( 'UPDATE services SET service_type = ? WHERE service_key = ?;', ( HC.LOCAL_FILE_TRASH_DOMAIN, sqlite3.Binary( CC.TRASH_SERVICE_KEY ) ) )

            # create new umbrella service that represents if we have the file or not locally

            self._AddService( CC.COMBINED_LOCAL_FILE_SERVICE_KEY, HC.COMBINED_LOCAL_FILE, CC.COMBINED_LOCAL_FILE_SERVICE_KEY, {} )

            combined_local_file_service_id = self._GetServiceId( CC.COMBINED_LOCAL_FILE_SERVICE_KEY )
            local_file_service_id = self._GetServiceId( CC.LOCAL_FILE_SERVICE_KEY )
            trash_service_id = self._GetServiceId( CC.TRASH_SERVICE_KEY )

            # copy all local/trash records to the new umbrella service, and move deleted_files and pending_files responsibility over

            rows = self._c.execute( 'SELECT hash_id, timestamp FROM current_files WHERE service_id IN ( ?, ? );', ( local_file_service_id, trash_service_id ) ).fetchall()

            self._c.executemany( 'INSERT OR IGNORE INTO current_files VALUES ( ?, ?, ? );', ( ( combined_local_file_service_id, hash_id, timestamp ) for ( hash_id, timestamp ) in rows ) )

            self._c.execute( 'UPDATE deleted_files SET service_id = ? WHERE service_id = ?;', ( combined_local_file_service_id, local_file_service_id ) )

            self._c.execute( 'DELETE FROM service_info WHERE service_id = ? AND info_type = ?;', ( local_file_service_id, HC.SERVICE_INFO_NUM_DELETED_FILES ) )

            self._c.execute( 'UPDATE file_transfers SET service_id = ? WHERE service_id = ?;', ( combined_local_file_service_id, local_file_service_id ) )

            # now it has files, refresh the ac cache

            self._controller.pub( 'splash_set_status_text', 'creating autocomplete cache for new service' )

            tag_service_ids = self._GetServiceIds( HC.TAG_SERVICES )

            for tag_service_id in tag_service_ids:

                self._CacheSpecificMappingsDrop( combined_local_file_service_id, tag_service_id )

                self._CacheSpecificMappingsGenerate( combined_local_file_service_id, tag_service_id )


            # trash current_files rows can now have their own timestamp

            trash_rows = self._c.execute( 'SELECT hash_id, timestamp FROM file_trash;' ).fetchall()

            self._c.executemany( 'UPDATE current_files SET timestamp = ? WHERE service_id = ? AND hash_id = ?;', ( ( timestamp, trash_service_id, hash_id ) for ( hash_id, timestamp ) in rows ) )

            self._c.execute( 'DROP TABLE file_trash;' )

            message = 'I have fixed an important miscounting bug in the autocomplete cache. Please go database->maintenance->regenerate autocomplete cache when it is convenient.'

            self.pub_initial_message( message )


        if version == 239:

            self._c.execute( 'DROP TABLE analyze_timestamps;' )

            self._c.execute( 'CREATE TABLE analyze_timestamps ( name TEXT, num_rows INTEGER, timestamp INTEGER );' )

            #

            self._controller.pub( 'splash_set_status_text', 'setting up next step of similar files stuff' )

            self._c.execute( 'CREATE TABLE external_caches.shape_search_cache ( hash_id INTEGER PRIMARY KEY, searched_distance INTEGER );' )

            self._c.execute( 'CREATE TABLE external_caches.duplicate_pairs ( smaller_hash_id INTEGER, larger_hash_id INTEGER, duplicate_type INTEGER, PRIMARY KEY( smaller_hash_id, larger_hash_id ) );' )
            self._c.execute( 'CREATE UNIQUE INDEX external_caches.duplicate_pairs_reversed_hash_ids ON duplicate_pairs ( larger_hash_id, smaller_hash_id );' )

            combined_local_file_service_id = self._GetServiceId( CC.COMBINED_LOCAL_FILE_SERVICE_KEY )

            self._c.execute( 'INSERT OR IGNORE INTO shape_search_cache SELECT hash_id, NULL FROM current_files, files_info USING ( hash_id ) WHERE service_id = ? and mime IN ' + HydrusData.SplayListForDB( HC.MIMES_WE_CAN_PHASH ) + ';', ( combined_local_file_service_id, ) )


        self._controller.pub( 'splash_set_title_text', 'updated db to v' + str( version + 1 ) )

        self._c.execute( 'UPDATE version SET version = ?;', ( version + 1, ) )


    def _UpdateImageboards( self, site_edit_log ):

        for ( site_action, site_data ) in site_edit_log:

            if site_action == HC.ADD:

                site_name = site_data

                self._GetSiteId( site_name )

            elif site_action == HC.DELETE:

                site_name = site_data

                site_id = self._GetSiteId( site_name )

                self._c.execute( 'DELETE FROM imageboard_sites WHERE site_id = ?;', ( site_id, ) )
                self._c.execute( 'DELETE FROM imageboards WHERE site_id = ?;', ( site_id, ) )

            elif site_action == HC.EDIT:

                ( site_name, edit_log ) = site_data

                site_id = self._GetSiteId( site_name )

                for ( action, data ) in edit_log:

                    if action == HC.ADD:

                        name = data

                        imageboard = ClientData.Imageboard( name, '', 60, [], {} )

                        self._c.execute( 'INSERT INTO imageboards ( site_id, name, imageboard ) VALUES ( ?, ?, ? );', ( site_id, name, imageboard ) )

                    elif action == HC.DELETE:

                        name = data

                        self._c.execute( 'DELETE FROM imageboards WHERE site_id = ? AND name = ?;', ( site_id, name ) )

                    elif action == HC.EDIT:

                        imageboard = data

                        name = imageboard.GetName()

                        self._c.execute( 'UPDATE imageboards SET imageboard = ? WHERE site_id = ? AND name = ?;', ( imageboard, site_id, name ) )


    def _UpdateMappings( self, tag_service_id, mappings_ids = None, deleted_mappings_ids = None, pending_mappings_ids = None, pending_rescinded_mappings_ids = None, petitioned_mappings_ids = None, petitioned_rescinded_mappings_ids = None ):

        ( current_mappings_table_name, deleted_mappings_table_name, pending_mappings_table_name, petitioned_mappings_table_name ) = GenerateMappingsTableNames( tag_service_id )

        if mappings_ids is None: mappings_ids = []
        if deleted_mappings_ids is None: deleted_mappings_ids = []
        if pending_mappings_ids is None: pending_mappings_ids = []
        if pending_rescinded_mappings_ids is None: pending_rescinded_mappings_ids = []
        if petitioned_mappings_ids is None: petitioned_mappings_ids = []
        if petitioned_rescinded_mappings_ids is None: petitioned_rescinded_mappings_ids = []

        file_service_ids = self._GetServiceIds( HC.AUTOCOMPLETE_CACHE_SPECIFIC_FILE_SERVICES )

        # this method grew into a monster that merged deleted, pending and current according to a hierarchy of services
        # this cost a lot of CPU time and was extremely difficult to maintain
        # now it attempts a simpler union, not letting delete overwrite a current or pending

        other_service_ids = [ service_id for service_id in self._GetServiceIds( HC.TAG_SERVICES ) if service_id != tag_service_id ]

        splayed_other_service_ids = HydrusData.SplayListForDB( other_service_ids )

        change_in_num_mappings = 0
        change_in_num_deleted_mappings = 0
        change_in_num_pending_mappings = 0
        change_in_num_petitioned_mappings = 0
        change_in_num_tags = 0
        change_in_num_files = 0

        all_adds = mappings_ids + pending_mappings_ids

        tag_ids_being_added = { tag_id for ( namespace_id, tag_id, hash_ids ) in all_adds }

        hash_ids_lists = [ hash_ids for ( namespace_id, tag_id, hash_ids ) in all_adds ]
        hash_ids_being_added = { hash_id for hash_id in itertools.chain.from_iterable( hash_ids_lists ) }

        all_removes = deleted_mappings_ids + pending_rescinded_mappings_ids

        tag_ids_being_removed = { tag_id for ( namespace_id, tag_id, hash_ids ) in all_removes }

        hash_ids_lists = [ hash_ids for ( namespace_id, tag_id, hash_ids ) in all_removes ]
        hash_ids_being_removed = { hash_id for hash_id in itertools.chain.from_iterable( hash_ids_lists ) }

        tag_ids_to_search_for = tag_ids_being_added.union( tag_ids_being_removed )
        hash_ids_to_search_for = hash_ids_being_added.union( hash_ids_being_removed )

        self._c.execute( 'CREATE TABLE mem.temp_tag_ids ( tag_id INTEGER );' )
        self._c.execute( 'CREATE TABLE mem.temp_hash_ids ( hash_id INTEGER );' )

        self._c.executemany( 'INSERT INTO temp_tag_ids ( tag_id ) VALUES ( ? );', ( ( tag_id, ) for tag_id in tag_ids_to_search_for ) )
        self._c.executemany( 'INSERT INTO temp_hash_ids ( hash_id ) VALUES ( ? );', ( ( hash_id, ) for hash_id in hash_ids_to_search_for ) )

        pre_existing_tag_ids = { tag_id for ( tag_id, ) in self._c.execute( 'SELECT tag_id as t FROM temp_tag_ids WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE tag_id = t );' ) }
        pre_existing_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id as h FROM temp_hash_ids WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE hash_id = h );' ) }

        num_tags_added = len( tag_ids_being_added.difference( pre_existing_tag_ids ) )
        num_files_added = len( hash_ids_being_added.difference( pre_existing_hash_ids ) )

        change_in_num_tags += num_tags_added
        change_in_num_files += num_files_added

        combined_files_current_counter = collections.Counter()
        combined_files_pending_counter = collections.Counter()

        if len( mappings_ids ) > 0:

            for ( namespace_id, tag_id, hash_ids ) in mappings_ids:

                splayed_hash_ids = HydrusData.SplayListForDB( hash_ids )

                self._c.execute( 'DELETE FROM ' + deleted_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( namespace_id, tag_id ) )

                num_deleted_deleted = self._GetRowCount()

                self._c.execute( 'DELETE FROM ' + pending_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( namespace_id, tag_id ) )

                num_pending_deleted = self._GetRowCount()

                self._c.executemany( 'INSERT OR IGNORE INTO ' + current_mappings_table_name + ' VALUES ( ?, ?, ? );', [ ( namespace_id, tag_id, hash_id ) for hash_id in hash_ids ] )

                num_current_inserted = self._GetRowCount()

                change_in_num_deleted_mappings -= num_deleted_deleted
                change_in_num_pending_mappings -= num_pending_deleted
                change_in_num_mappings += num_current_inserted

                combined_files_pending_counter[ ( namespace_id, tag_id ) ] -= num_pending_deleted
                combined_files_current_counter[ ( namespace_id, tag_id ) ] += num_current_inserted


            for file_service_id in file_service_ids:

                self._CacheSpecificMappingsAddMappings( file_service_id, tag_service_id, mappings_ids )


        if len( deleted_mappings_ids ) > 0:

            for ( namespace_id, tag_id, hash_ids ) in deleted_mappings_ids:

                splayed_hash_ids = HydrusData.SplayListForDB( hash_ids )

                self._c.execute( 'DELETE FROM ' + current_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( namespace_id, tag_id ) )

                num_current_deleted = self._GetRowCount()

                self._c.execute( 'DELETE FROM ' + petitioned_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + splayed_hash_ids + ';', ( namespace_id, tag_id ) )

                num_petitions_deleted = self._GetRowCount()

                self._c.executemany( 'INSERT OR IGNORE INTO ' + deleted_mappings_table_name + ' VALUES ( ?, ?, ? );', [ ( namespace_id, tag_id, hash_id ) for hash_id in hash_ids ] )

                num_deleted_inserted = self._GetRowCount()

                change_in_num_mappings -= num_current_deleted
                change_in_num_petitioned_mappings -= num_petitions_deleted
                change_in_num_deleted_mappings += num_deleted_inserted

                combined_files_current_counter[ ( namespace_id, tag_id ) ] -= num_current_deleted


            for file_service_id in file_service_ids:

                self._CacheSpecificMappingsDeleteMappings( file_service_id, tag_service_id, deleted_mappings_ids )


        if len( pending_mappings_ids ) > 0:

            culled_pending_mappings_ids = []

            for ( namespace_id, tag_id, hash_ids ) in pending_mappings_ids:

                with HydrusDB.TemporaryIntegerTable( self._c, hash_ids, 'hash_id' ) as temp_table_name:

                    existing_current_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id FROM ' + temp_table_name + ', ' + current_mappings_table_name + ' USING ( hash_id ) WHERE namespace_id = ? AND tag_id = ?;', ( namespace_id, tag_id ) ) }


                valid_hash_ids = set( hash_ids ).difference( existing_current_hash_ids )

                culled_pending_mappings_ids.append( ( namespace_id, tag_id, valid_hash_ids ) )


            pending_mappings_ids = culled_pending_mappings_ids

            for ( namespace_id, tag_id, hash_ids ) in pending_mappings_ids:

                self._c.executemany( 'INSERT OR IGNORE INTO ' + pending_mappings_table_name + ' VALUES ( ?, ?, ? );', [ ( namespace_id, tag_id, hash_id ) for hash_id in hash_ids ] )

                num_pending_inserted = self._GetRowCount()

                change_in_num_pending_mappings += num_pending_inserted

                combined_files_pending_counter[ ( namespace_id, tag_id ) ] += num_pending_inserted


            for file_service_id in file_service_ids:

                self._CacheSpecificMappingsPendMappings( file_service_id, tag_service_id, pending_mappings_ids )


        if len( pending_rescinded_mappings_ids ) > 0:

            for ( namespace_id, tag_id, hash_ids ) in pending_rescinded_mappings_ids:

                self._c.execute( 'DELETE FROM ' + pending_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( namespace_id, tag_id ) )

                num_pending_deleted = self._GetRowCount()

                change_in_num_pending_mappings -= num_pending_deleted

                combined_files_pending_counter[ ( namespace_id, tag_id ) ] -= num_pending_deleted


            for file_service_id in file_service_ids:

                self._CacheSpecificMappingsRescindPendingMappings( file_service_id, tag_service_id, pending_rescinded_mappings_ids )


        combined_files_seen_ids = set( ( key for ( key, value ) in combined_files_current_counter.items() if value != 0 ) )
        combined_files_seen_ids.update( ( key for ( key, value ) in combined_files_pending_counter.items() if value != 0 ) )

        combined_files_counts = [ ( namespace_id, tag_id, combined_files_current_counter[ ( namespace_id, tag_id ) ], combined_files_pending_counter[ ( namespace_id, tag_id ) ] ) for ( namespace_id, tag_id ) in combined_files_seen_ids ]

        self._CacheCombinedFilesMappingsUpdate( tag_service_id, combined_files_counts )

        #

        post_existing_tag_ids = { tag_id for ( tag_id, ) in self._c.execute( 'SELECT tag_id as t FROM temp_tag_ids WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE tag_id = t );' ) }
        post_existing_hash_ids = { hash_id for ( hash_id, ) in self._c.execute( 'SELECT hash_id as h FROM temp_hash_ids WHERE EXISTS ( SELECT 1 FROM ' + current_mappings_table_name + ' WHERE hash_id = h );' ) }

        self._c.execute( 'DROP TABLE temp_tag_ids;' )
        self._c.execute( 'DROP TABLE temp_hash_ids;' )

        num_tags_removed = len( pre_existing_tag_ids.intersection( tag_ids_being_removed ).difference( post_existing_tag_ids ) )
        num_files_removed = len( pre_existing_hash_ids.intersection( hash_ids_being_removed ).difference( post_existing_hash_ids ) )

        change_in_num_tags -= num_tags_removed
        change_in_num_files -= num_files_removed

        for ( namespace_id, tag_id, hash_ids, reason_id ) in petitioned_mappings_ids:

            self._c.executemany( 'INSERT OR IGNORE INTO ' + petitioned_mappings_table_name + ' VALUES ( ?, ?, ?, ? );', [ ( namespace_id, tag_id, hash_id, reason_id ) for hash_id in hash_ids ] )

            num_petitions_inserted = self._GetRowCount()

            change_in_num_petitioned_mappings += num_petitions_inserted


        for ( namespace_id, tag_id, hash_ids ) in petitioned_rescinded_mappings_ids:

            self._c.execute( 'DELETE FROM ' + petitioned_mappings_table_name + ' WHERE namespace_id = ? AND tag_id = ? AND hash_id IN ' + HydrusData.SplayListForDB( hash_ids ) + ';', ( namespace_id, tag_id ) )

            num_petitions_deleted = self._GetRowCount()

            change_in_num_petitioned_mappings -= num_petitions_deleted


        service_info_updates = []

        if change_in_num_mappings != 0: service_info_updates.append( ( change_in_num_mappings, tag_service_id, HC.SERVICE_INFO_NUM_MAPPINGS ) )
        if change_in_num_deleted_mappings != 0: service_info_updates.append( ( change_in_num_deleted_mappings, tag_service_id, HC.SERVICE_INFO_NUM_DELETED_MAPPINGS ) )
        if change_in_num_pending_mappings != 0: service_info_updates.append( ( change_in_num_pending_mappings, tag_service_id, HC.SERVICE_INFO_NUM_PENDING_MAPPINGS ) )
        if change_in_num_petitioned_mappings != 0: service_info_updates.append( ( change_in_num_petitioned_mappings, tag_service_id, HC.SERVICE_INFO_NUM_PETITIONED_MAPPINGS ) )
        if change_in_num_tags != 0: service_info_updates.append( ( change_in_num_tags, tag_service_id, HC.SERVICE_INFO_NUM_TAGS ) )
        if change_in_num_files != 0: service_info_updates.append( ( change_in_num_files, tag_service_id, HC.SERVICE_INFO_NUM_FILES ) )

        if len( service_info_updates ) > 0: self._c.executemany( 'UPDATE service_info SET info = info + ? WHERE service_id = ? AND info_type = ?;', service_info_updates )


    def _UpdateServerServices( self, admin_service_key, original_services_info, edit_log, service_keys_to_access_keys ):

        self._c.execute( 'COMMIT;' )

        if not self._fast_big_transaction_wal:

            self._c.execute( 'PRAGMA journal_mode = TRUNCATE;' )


        self._c.execute( 'PRAGMA foreign_keys = ON;' )

        self._c.execute( 'BEGIN IMMEDIATE;' )

        self.pub_after_commit( 'notify_new_services_data' )
        self.pub_after_commit( 'notify_new_services_gui' )

        admin_service_id = self._GetServiceId( admin_service_key )

        admin_service = self._GetService( admin_service_id )

        admin_info = admin_service.GetInfo()

        host = admin_info[ 'host' ]

        #

        server_service_keys_to_client_service_info = {}

        current_client_services_info = self._c.execute( 'SELECT service_key, service_type, info FROM services;' ).fetchall()

        for ( server_service_key, service_type, server_options ) in original_services_info:

            server_port = server_options[ 'port' ]

            for ( client_service_key, service_type, client_info ) in current_client_services_info:

                if 'host' in client_info and 'port' in client_info:

                    if client_info[ 'host' ] == host and client_info[ 'port' ] == server_port:

                        server_service_keys_to_client_service_info[ server_service_key ] = ( client_service_key, service_type, client_info )


        #

        for ( action, data ) in edit_log:

            if action == HC.ADD:

                ( service_key, service_type, server_options ) = data

                info = {}

                info[ 'host' ] = host
                info[ 'port' ] = server_options[ 'port' ]
                info[ 'access_key' ] = service_keys_to_access_keys[ service_key ]

                name = HC.service_string_lookup[ service_type ] + ' at ' + host + ':' + str( info[ 'port' ] )

                self._AddService( service_key, service_type, name, info )

            elif action == HC.DELETE:

                server_service_key = data

                if server_service_key in server_service_keys_to_client_service_info:

                    ( client_service_key, service_type, client_info ) = server_service_keys_to_client_service_info[ server_service_key ]

                    service_id = self._GetServiceId( client_service_key )

                    self._DeleteService( service_id )


            elif action == HC.EDIT:

                ( server_service_key, service_type, server_options ) = data

                if server_service_key in server_service_keys_to_client_service_info:

                    ( client_service_key, service_type, client_info ) = server_service_keys_to_client_service_info[ server_service_key ]

                    service_id = self._GetServiceId( client_service_key )

                    client_info[ 'port' ] = server_options[ 'port' ]

                    self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( client_info, service_id ) )


        self.pub_after_commit( 'notify_new_pending' )

        self._c.execute( 'COMMIT;' )

        self._InitDBCursor()

        self._c.execute( 'BEGIN IMMEDIATE;' )


    def _UpdateServices( self, edit_log ):

        self._c.execute( 'COMMIT;' )

        if not self._fast_big_transaction_wal:

            self._c.execute( 'PRAGMA journal_mode = TRUNCATE;' )


        self._c.execute( 'PRAGMA foreign_keys = ON;' )

        self._c.execute( 'BEGIN IMMEDIATE;' )

        self.pub_after_commit( 'notify_new_services_data' )
        self.pub_after_commit( 'notify_new_services_gui' )

        for entry in edit_log:

            action = entry.GetAction()

            if action == HC.ADD:

                ( service_key, service_type, name, info ) = entry.GetData()

                self._AddService( service_key, service_type, name, info )

            elif action == HC.DELETE:

                service_key = entry.GetIdentifier()

                service_id = self._GetServiceId( service_key )

                self._DeleteService( service_id )

            elif action == HC.EDIT:

                ( service_key, service_type, new_name, info_update ) = entry.GetData()

                service_id = self._GetServiceId( service_key )

                self._c.execute( 'UPDATE services SET name = ? WHERE service_id = ?;', ( new_name, service_id ) )

                if service_type in HC.RESTRICTED_SERVICES:

                    account = HydrusData.GetUnknownAccount()

                    account.MakeStale()

                    info_update[ 'account' ] = account

                    self.pub_after_commit( 'permissions_are_stale' )

                    session_manager = HydrusGlobals.client_controller.GetClientSessionManager()

                    session_manager.DeleteSessionKey( service_key )


                if service_type in HC.TAG_SERVICES:

                    ( old_info, ) = self._c.execute( 'SELECT info FROM services WHERE service_id = ?;', ( service_id, ) ).fetchone()

                    old_tag_archive_sync = old_info[ 'tag_archive_sync' ]
                    new_tag_archive_sync = info_update[ 'tag_archive_sync' ]

                    for portable_hta_path in new_tag_archive_sync.keys():

                        namespaces = set( new_tag_archive_sync[ portable_hta_path ] )

                        if portable_hta_path in old_tag_archive_sync:

                            old_namespaces = old_tag_archive_sync[ portable_hta_path ]

                            namespaces.difference_update( old_namespaces )

                            if len( namespaces ) == 0:

                                continue


                        hta_path = HydrusPaths.ConvertPortablePathToAbsPath( portable_hta_path )

                        file_service_key = CC.LOCAL_FILE_SERVICE_KEY

                        adding = True

                        self._controller.pub( 'sync_to_tag_archive', hta_path, service_key, file_service_key, adding, namespaces )


                self._UpdateServiceInfo( service_id, info_update )

                if service_id in self._service_cache: del self._service_cache[ service_id ]

                if service_type == HC.LOCAL_BOORU:

                    self.pub_after_commit( 'restart_booru' )
                    self.pub_after_commit( 'notify_new_upnp_mappings' )


        self.pub_after_commit( 'notify_new_pending' )

        self._c.execute( 'COMMIT;' )

        self._InitDBCursor()

        self._c.execute( 'BEGIN IMMEDIATE;' )


    def _UpdateServiceInfo( self, service_id, update ):

        ( info, ) = self._c.execute( 'SELECT info FROM services WHERE service_id = ?;', ( service_id, ) ).fetchone()

        for ( k, v ) in update.items(): info[ k ] = v

        self._c.execute( 'UPDATE services SET info = ? WHERE service_id = ?;', ( info, service_id ) )


    def _Vacuum( self, stop_time = None, force_vacuum = False ):

        new_options = self._controller.GetNewOptions()

        maintenance_vacuum_period_days = new_options.GetNoneableInteger( 'maintenance_vacuum_period_days' )

        if maintenance_vacuum_period_days is None:

            return


        stale_time_delta = maintenance_vacuum_period_days * 86400

        existing_names_to_timestamps = dict( self._c.execute( 'SELECT name, timestamp FROM vacuum_timestamps;' ).fetchall() )

        db_names = [ name for ( index, name, path ) in self._c.execute( 'PRAGMA database_list;' ) if name not in ( 'mem', 'temp' ) ]

        if force_vacuum:

            due_names = db_names

        else:

            due_names = [ name for name in db_names if name not in existing_names_to_timestamps or HydrusData.TimeHasPassed( existing_names_to_timestamps[ name ] + stale_time_delta ) ]


        if len( due_names ) > 0:

            self._c.execute( 'COMMIT;' )

            job_key_pubbed = False

            job_key = ClientThreading.JobKey()

            job_key.SetVariable( 'popup_title', 'database maintenance - vacuum' )

            self._CloseDBCursor()

            try:

                time.sleep( 1 )

                names_done = []

                for name in due_names:

                    try:

                        db_path = os.path.join( self._db_dir, self._db_filenames[ name ] )

                        if HydrusDB.CanVacuum( db_path, stop_time = stop_time ):

                            if not job_key_pubbed:

                                self._controller.pub( 'message', job_key )

                                job_key_pubbed = True


                            self._controller.pub( 'splash_set_status_text', 'vacuuming ' + name )
                            job_key.SetVariable( 'popup_text_1', 'vacuuming ' + name )

                            started = HydrusData.GetNowPrecise()

                            HydrusDB.VacuumDB( db_path )

                            time_took = HydrusData.GetNowPrecise() - started

                            HydrusData.Print( 'Vacuumed ' + db_path + ' in ' + HydrusData.ConvertTimeDeltaToPrettyString( time_took ) )

                            names_done.append( name )


                    except Exception as e:

                        HydrusData.Print( 'vacuum failed:' )

                        HydrusData.ShowException( e )

                        size = os.path.getsize( db_path )

                        pretty_size = HydrusData.ConvertIntToBytes( size )

                        text = 'An attempt to vacuum the database failed.'
                        text += os.linesep * 2
                        text += 'For now, automatic vacuuming has been disabled. If the error is not obvious, please contact the hydrus developer.'

                        HydrusData.ShowText( text )

                        self._InitDBCursor()

                        self._c.execute( 'BEGIN IMMEDIATE;' )

                        new_options.SetNoneableInteger( 'maintenance_vacuum_period_days', None )

                        self._SaveOptions( HC.options )

                        return


                job_key.SetVariable( 'popup_text_1', 'cleaning up' )

            finally:

                self._InitDBCursor()

                self._c.execute( 'BEGIN IMMEDIATE;' )

                self._c.executemany( 'DELETE FROM vacuum_timestamps WHERE name = ?;', ( ( name, ) for name in names_done ) )

                self._c.executemany( 'INSERT OR IGNORE INTO vacuum_timestamps ( name, timestamp ) VALUES ( ?, ? );', ( ( name, HydrusData.GetNow() ) for name in names_done ) )

                job_key.SetVariable( 'popup_text_1', 'done!' )

                job_key.Delete( 30 )


    def _Write( self, action, *args, **kwargs ):

        if action == 'analyze': result = self._AnalyzeStaleBigTables( *args, **kwargs )
        elif action == 'backup': result = self._Backup( *args, **kwargs )
        elif action == 'content_update_package':result = self._ProcessContentUpdatePackage( *args, **kwargs )
        elif action == 'content_updates':result = self._ProcessContentUpdates( *args, **kwargs )
        elif action == 'db_integrity': result = self._CheckDBIntegrity( *args, **kwargs )
        elif action == 'delete_hydrus_session_key': result = self._DeleteHydrusSessionKey( *args, **kwargs )
        elif action == 'delete_imageboard': result = self._DeleteYAMLDump( YAML_DUMP_ID_IMAGEBOARD, *args, **kwargs )
        elif action == 'delete_local_booru_share': result = self._DeleteYAMLDump( YAML_DUMP_ID_LOCAL_BOORU, *args, **kwargs )
        elif action == 'delete_pending': result = self._DeletePending( *args, **kwargs )
        elif action == 'delete_remote_booru': result = self._DeleteYAMLDump( YAML_DUMP_ID_REMOTE_BOORU, *args, **kwargs )
        elif action == 'delete_serialisable_named': result = self._DeleteJSONDumpNamed( *args, **kwargs )
        elif action == 'delete_service_info': result = self._DeleteServiceInfo( *args, **kwargs )
        elif action == 'export_mappings': result = self._ExportToTagArchive( *args, **kwargs )
        elif action == 'file_integrity': result = self._CheckFileIntegrity( *args, **kwargs )
        elif action == 'hydrus_session': result = self._AddHydrusSession( *args, **kwargs )
        elif action == 'imageboard': result = self._SetYAMLDump( YAML_DUMP_ID_IMAGEBOARD, *args, **kwargs )
        elif action == 'import_file': result = self._ImportFile( *args, **kwargs )
        elif action == 'local_booru_share': result = self._SetYAMLDump( YAML_DUMP_ID_LOCAL_BOORU, *args, **kwargs )
        elif action == 'maintain_similar_files_tree': result = self._CacheSimilarFilesMaintainTree( *args, **kwargs )
        elif action == 'push_recent_tags': result = self._PushRecentTags( *args, **kwargs )
        elif action == 'regenerate_ac_cache': result = self._RegenerateACCache( *args, **kwargs )
        elif action == 'regenerate_similar_files': result = self._CacheSimilarFilesRegenerateTree( *args, **kwargs )
        elif action == 'relocate_client_files': result = self._RelocateClientFiles( *args, **kwargs )
        elif action == 'remote_booru': result = self._SetYAMLDump( YAML_DUMP_ID_REMOTE_BOORU, *args, **kwargs )
        elif action == 'reset_service': result = self._ResetService( *args, **kwargs )
        elif action == 'save_options': result = self._SaveOptions( *args, **kwargs )
        elif action == 'serialisable_simple': result = self._SetJSONSimple( *args, **kwargs )
        elif action == 'serialisable': result = self._SetJSONDump( *args, **kwargs )
        elif action == 'serialisables_overwrite': result = self._OverwriteJSONDumps( *args, **kwargs )
        elif action == 'service_updates': result = self._ProcessServiceUpdates( *args, **kwargs )
        elif action == 'set_password': result = self._SetPassword( *args, **kwargs )
        elif action == 'sync_hashes_to_tag_archive': result = self._SyncHashesToTagArchive( *args, **kwargs )
        elif action == 'tag_censorship': result = self._SetTagCensorship( *args, **kwargs )
        elif action == 'update_server_services': result = self._UpdateServerServices( *args, **kwargs )
        elif action == 'update_services': result = self._UpdateServices( *args, **kwargs )
        elif action == 'vacuum': result = self._Vacuum( *args, **kwargs )
        elif action == 'web_session': result = self._AddWebSession( *args, **kwargs )
        else: raise Exception( 'db received an unknown write command: ' + action )

        return result


    def pub_content_updates_after_commit( self, service_keys_to_content_updates ):

        self.pub_after_commit( 'content_updates_data', service_keys_to_content_updates )
        self.pub_after_commit( 'content_updates_gui', service_keys_to_content_updates )


    def pub_initial_message( self, message ):

        self._initial_messages.append( message )


    def pub_service_updates_after_commit( self, service_keys_to_service_updates ):

        self.pub_after_commit( 'service_updates_data', service_keys_to_service_updates )
        self.pub_after_commit( 'service_updates_gui', service_keys_to_service_updates )


    def GetInitialMessages( self ):

        return self._initial_messages


    def GetUpdatesDir( self ):

        return self._updates_dir


    def RestoreBackup( self, path ):

        for filename in self._db_filenames.values():

            source = os.path.join( path, filename )
            dest = os.path.join( self._db_dir, filename )

            if os.path.exists( source ):

                HydrusPaths.MirrorFile( source, dest )

            else:

                # if someone backs up with an older version that does not have as many db files as this version, we get conflict
                # don't want to delete just in case, but we will move it out the way

                HydrusPaths.MergeFile( dest, dest + '.old' )


        client_files_source = os.path.join( path, 'client_files' )
        client_files_default = os.path.join( self._db_dir, 'client_files' )

        if os.path.exists( client_files_source ):

            HydrusPaths.MirrorTree( client_files_source, client_files_default )


        HydrusPaths.MirrorTree( os.path.join( path, 'client_updates' ), self._updates_dir )