GridFS - Фрагментация, производительность и индексы - PullRequest
0 голосов
/ 08 мая 2019

В моей производственной среде в GridFS хранятся миллионы файлов; сейчас мы, кроме того, начинаем удалять их, чтобы освободить место.

Статистика БД:

{ 
    "db" : "Dummy", 
    "collections" : NumberInt(5), 
    "views" : NumberInt(0), 
    "objects" : NumberInt(60344915), 
    "avgObjSize" : 14560.387591033976, 
    "dataSize" : 878645351548.0, 
    "storageSize" : 724202864640.0, 
    "numExtents" : NumberInt(0), 
    "indexes" : NumberInt(7), 
    "indexSize" : 2633293824.0, 
    "ok" : 1.0
}

Статистика коллекций:

{ 
    "ns" : "Dummy.Coll1", 
    "size" : 4708693124.0, 
    "count" : NumberInt(12412954), 
    "avgObjSize" : NumberInt(379), 
    "storageSize" : 1710395392.0, 
    "capped" : false, 
    "nindexes" : NumberInt(1), 
    "indexDetails" : {
        "_id_" : {
            "metadata" : {
                "formatVersion" : NumberInt(8), 
                "infoObj" : "{ \"v\" : 2, \"key\" : { \"_id\" : 1 }, \"name\" : \"_id_\", \"ns\" : \"Dummy.Coll1\" }"
            }, 
            "creationString" : "access_pattern_hint=none,allocation_size=4KB,app_metadata=(formatVersion=8,infoObj={ \"v\" : 2, \"key\" : { \"_id\" : 1 }, \"name\" : \"_id_\", \"ns\" : \"SistemiHubBridge.FattureRicevute\" }),block_allocation=best,block_compressor=,cache_resident=false,checksum=on,colgroups=,collator=,columns=,dictionary=0,encryption=(keyid=,name=),exclusive=false,extractor=,format=btree,huffman_key=,huffman_value=,ignore_in_memory_cache_size=false,immutable=false,internal_item_max=0,internal_key_max=0,internal_key_truncate=true,internal_page_max=16k,key_format=u,key_gap=10,leaf_item_max=0,leaf_key_max=0,leaf_page_max=16k,leaf_value_max=0,log=(enabled=true),lsm=(auto_throttle=true,bloom=true,bloom_bit_count=16,bloom_config=,bloom_hash_count=8,bloom_oldest=false,chunk_count_limit=0,chunk_max=5GB,chunk_size=10MB,merge_max=15,merge_min=0),memory_page_max=5MB,os_cache_dirty_max=0,os_cache_max=0,prefix_compression=true,prefix_compression_min=4,source=,split_deepen_min_child=0,split_deepen_per_child=0,split_pct=90,type=file,value_format=u", 
            "type" : "file", 
            "uri" : "statistics:table:index-10--4068436889899522135", 
            "LSM" : {
                "bloom filter false positives" : NumberInt(0), 
                "bloom filter hits" : NumberInt(0), 
                "bloom filter misses" : NumberInt(0), 
                "bloom filter pages evicted from cache" : NumberInt(0), 
                "bloom filter pages read into cache" : NumberInt(0), 
                "bloom filters in the LSM tree" : NumberInt(0), 
                "chunks in the LSM tree" : NumberInt(0), 
                "highest merge generation in the LSM tree" : NumberInt(0), 
                "queries that could have benefited from a Bloom filter that did not exist" : NumberInt(0), 
                "sleep for LSM checkpoint throttle" : NumberInt(0), 
                "sleep for LSM merge throttle" : NumberInt(0), 
                "total size of bloom filters" : NumberInt(0)
            }, 
            "block-manager" : {
                "allocations requiring file extension" : NumberInt(23804), 
                "blocks allocated" : NumberInt(512341), 
                "blocks freed" : NumberInt(197235), 
                "checkpoint size" : NumberInt(167079936), 
                "file allocation unit size" : NumberInt(4096), 
                "file bytes available for reuse" : NumberInt(1155072), 
                "file magic number" : NumberInt(120897), 
                "file major version number" : NumberInt(1), 
                "file size in bytes" : NumberInt(168251392), 
                "minor version number" : NumberInt(0)
            }, 
            "btree" : {
                "btree checkpoint generation" : NumberInt(104735), 
                "column-store fixed-size leaf pages" : NumberInt(0), 
                "column-store internal pages" : NumberInt(0), 
                "column-store variable-size RLE encoded values" : NumberInt(0), 
                "column-store variable-size deleted values" : NumberInt(0), 
                "column-store variable-size leaf pages" : NumberInt(0), 
                "fixed-record size" : NumberInt(0), 
                "maximum internal page key size" : NumberInt(1474), 
                "maximum internal page size" : NumberInt(16384), 
                "maximum leaf page key size" : NumberInt(1474), 
                "maximum leaf page size" : NumberInt(16384), 
                "maximum leaf page value size" : NumberInt(7372), 
                "maximum tree depth" : NumberInt(4), 
                "number of key/value pairs" : NumberInt(0), 
                "overflow pages" : NumberInt(0), 
                "pages rewritten by compaction" : NumberInt(0), 
                "row-store internal pages" : NumberInt(0), 
                "row-store leaf pages" : NumberInt(0)
            }, 
            "cache" : {
                "bytes currently in the cache" : NumberInt(247269), 
                "bytes read into cache" : NumberInt(31710621), 
                "bytes written from cache" : 2602068426.0, 
                "checkpoint blocked page eviction" : NumberInt(0), 
                "data source pages selected for eviction unable to be evicted" : NumberInt(11), 
                "hazard pointer blocked page eviction" : NumberInt(0), 
                "in-memory page passed criteria to be split" : NumberInt(184), 
                "in-memory page splits" : NumberInt(92), 
                "internal pages evicted" : NumberInt(101), 
                "internal pages split during eviction" : NumberInt(1), 
                "leaf pages split during eviction" : NumberInt(1342), 
                "modified pages evicted" : NumberInt(2843), 
                "overflow pages read into cache" : NumberInt(0), 
                "overflow values cached in memory" : NumberInt(0), 
                "page split during eviction deepened the tree" : NumberInt(1), 
                "page written requiring lookaside records" : NumberInt(0), 
                "pages read into cache" : NumberInt(2608), 
                "pages read into cache requiring lookaside entries" : NumberInt(0), 
                "pages requested from the cache" : NumberInt(12903606), 
                "pages written from cache" : NumberInt(309295), 
                "pages written requiring in-memory restoration" : NumberInt(0), 
                "tracked dirty bytes in the cache" : NumberInt(175139), 
                "unmodified pages evicted" : NumberInt(772)
            }, 
            "cache_walk" : {
                "Average difference between current eviction generation when the page was last considered" : NumberInt(0), 
                "Average on-disk page image size seen" : NumberInt(0), 
                "Clean pages currently in cache" : NumberInt(0), 
                "Current eviction generation" : NumberInt(0), 
                "Dirty pages currently in cache" : NumberInt(0), 
                "Entries in the root page" : NumberInt(0), 
                "Internal pages currently in cache" : NumberInt(0), 
                "Leaf pages currently in cache" : NumberInt(0), 
                "Maximum difference between current eviction generation when the page was last considered" : NumberInt(0), 
                "Maximum page size seen" : NumberInt(0), 
                "Minimum on-disk page image size seen" : NumberInt(0), 
                "On-disk page image sizes smaller than a single allocation unit" : NumberInt(0), 
                "Pages created in memory and never written" : NumberInt(0), 
                "Pages currently queued for eviction" : NumberInt(0), 
                "Pages that could not be queued for eviction" : NumberInt(0), 
                "Refs skipped during cache traversal" : NumberInt(0), 
                "Size of the root page" : NumberInt(0), 
                "Total number of pages currently in cache" : NumberInt(0)
            }, 
            "compression" : {
                "compressed pages read" : NumberInt(0), 
                "compressed pages written" : NumberInt(0), 
                "page written failed to compress" : NumberInt(0), 
                "page written was too small to compress" : NumberInt(0), 
                "raw compression call failed, additional data available" : NumberInt(0), 
                "raw compression call failed, no additional data available" : NumberInt(0), 
                "raw compression call succeeded" : NumberInt(0)
            }, 
            "cursor" : {
                "bulk-loaded cursor-insert calls" : NumberInt(0), 
                "create calls" : NumberInt(8675), 
                "cursor-insert key and value bytes inserted" : NumberInt(220702884), 
                "cursor-remove key bytes removed" : NumberInt(0), 
                "cursor-update value bytes updated" : NumberInt(0), 
                "insert calls" : NumberInt(12267767), 
                "next calls" : NumberInt(0), 
                "prev calls" : NumberInt(0), 
                "remove calls" : NumberInt(0), 
                "reset calls" : NumberInt(12267769), 
                "restarted searches" : NumberInt(243), 
                "search calls" : NumberInt(2), 
                "search near calls" : NumberInt(0), 
                "truncate calls" : NumberInt(0), 
                "update calls" : NumberInt(0)
            }, 
            "reconciliation" : {
                "dictionary matches" : NumberInt(0), 
                "fast-path pages deleted" : NumberInt(0), 
                "internal page key bytes discarded using suffix compression" : NumberInt(16378777), 
                "internal page multi-block writes" : NumberInt(79547), 
                "internal-page overflow keys" : NumberInt(0), 
                "leaf page key bytes discarded using prefix compression" : 14049832267.0, 
                "leaf page multi-block writes" : NumberInt(89248), 
                "leaf-page overflow keys" : NumberInt(0), 
                "maximum blocks required for a page" : NumberInt(2), 
                "overflow values written" : NumberInt(0), 
                "page checksum matches" : NumberInt(1740545), 
                "page reconciliation calls" : NumberInt(288189), 
                "page reconciliation calls for eviction" : NumberInt(67), 
                "pages deleted" : NumberInt(0)
            }, 
            "session" : {
                "object compaction" : NumberInt(0), 
                "open cursor count" : NumberInt(11)
            }, 
            "transaction" : {
                "update conflicts" : NumberInt(0)
            }
        }
    }, 
    "totalIndexSize" : NumberInt(168251392), 
    "indexSizes" : {
        "_id_" : NumberInt(168251392)
    }, 
    "ok" : 1.0
}

Я использую MongoDB 3.4.15.

После удаления миллиона из них занимаемое пространство остаётся более или менее постоянным (с учётом новых вставок), но при последующих удалениях система начинает работать медленно. Я удаляю документы GridFS и обновляю записи, используя массовое обновление (bulk update).

Может ли эта проблема быть вызвана фрагментацией, возникшей из-за удаления? Нужно ли мне добавить какие-либо индексы? Нужно ли выполнить команду compact? Требуется ли для выполнения compact переводить коллекцию / базу данных в автономный режим, или эту команду можно выполнять в рамках обычного планового обслуживания?

Добро пожаловать на сайт PullRequest, где вы можете задавать вопросы и получать ответы от других членов сообщества.
...