azure - DocumentDB - 查询结果顺序

标签 azure azure-cosmosdb

我正在使用 Azure DocumentDB 来存储有关用户的信息。这些文档包含一个名为date_created的属性。我想向 documentDB 发送查询以检索存储在该集合中的所有用户。我还希望结果按从最新到最旧的顺序排列。

我目前在 DocumentDB 中实现了一个存储过程,它遍历集合并根据日期属性对结果进行排序。不过,我有两个问题:

  1. 当查询返回多个文档时,DocumentDB 使用的默认顺序是什么?
  2. 我知道 DocumentDB 尚不支持排序控制,但如果我使用存储过程对结果进行排序,我是否正在执行完整的集合扫描,或者数据库是否至少利用属性的索引我正在排序?作为引用,我使用的存储过程是这个(根据产品团队提供的 Azure 示例稍作修改):

    function orderBy(filterQuery, orderByFieldName, continuationToken) { 
    // HTTP error codes sent to our callback funciton by DocDB server. 
    var ErrorCode = { 
        REQUEST_ENTITY_TOO_LARGE: 413, 
    }
    var collection = getContext().getCollection(); 
    var collectionLink = collection.getSelfLink(); 
    var result = new Array(); 
    
    tryQuery({}); 
    
    function tryQuery(options) { 
        var isAccepted = (filterQuery && filterQuery.length) ? 
            collection.queryDocuments(collectionLink, filterQuery, options, callback) : 
            collection.readDocuments(collectionLink, options, callback) 
    
        if (!isAccepted) throw new Error("Source dataset is too large to complete the operation."); 
    } 
    
    /** 
    * queryDocuments callback. 
    * @param {Error} err - Error object in case of error/exception. 
    * @param {Array} queryFeed - array containing results of the query. 
    * @param {ResponseOptions} responseOptions. 
    */ 
    function callback(err, queryFeed, responseOptions) { 
        if (err) { 
            throw err; 
        } 
    
        // Iterate over document feed and store documents into the result array. 
        queryFeed.forEach(function (element, index, array) { 
            result[result.length] = element; 
        }); 
    
        if (responseOptions.continuation) { 
            // If there is continuation, call query again providing continuation token. 
            tryQuery({ continuation: responseOptions.continuation }); 
        } else { 
            // We are done with querying/got all results. Sort the results and return from the script. 
            result.sort(compare); 
    
            fillResponse(); 
        } 
    } 
    
    // Compare two objects(documents) using field specified by the orderByFieldName parameter. 
    // Return 0 if equal, -1 if less, 1 if greater. 
    function compare(x, y) { 
        if (x[orderByFieldName] == y[orderByFieldName]) return 0; 
        else if (x[orderByFieldName] < y[orderByFieldName]) return 1; 
        return -1; 
    } 
    
    // This is called in the very end on an already sorted array. 
    // Sort the results and set the response body. 
    function fillResponse() {
        var page_size = 20;
        // Main script is called with continuationToken which is the index of 1st item to start result batch from. 
        // Slice the result array and discard the beginning. From now on use the 'continuationResult' var. 
        var continuationResult = result; 
        if (continuationToken) continuationResult = result.slice(continuationToken); 
        else continuationToken = 0;
    
        if (page_size > continuationResult.length ) {
            page_size = continuationResult.length;
        }
    
        // Get/initialize the response. 
        var response = getContext().getResponse(); 
        response.setBody(null); 
    
        // Take care of response body getting too large: 
        // Set Response iterating by one element. When we fail due to MAX response size, return to the client requesting continuation. 
        var i = 0;
        var final_result = [];
        for (; i < page_size; ++i) { 
            try { 
                // Note: setBody is very expensive vs appendBody, use appendBody with simple approximation JSON.stringify(element).
                final_result.push(continuationResult[i]);                   
            } catch (ex) { 
                if (!ex.number == ErrorCode.REQUEST_ENTITY_TOO_LARGE) throw ex; 
                break; 
            } 
        } 
    
        /* Now next batch to return to client has i elements. 
        // Slice the continuationResult if needed and discard the end. */
        var partialResult = continuationResult; 
        var newContinuation = null; 
        if (i < continuationResult.length) { 
            partialResult = continuationResult.slice(0, i); 
        }
    
        // Finally, set response body.          
        response.setBody({ result: final_result, continuation: i }); 
    } 
    

    }

最佳答案

更新:截至 2015 年 7 月 - DocumentDB 在查询中支持 ORDER BY

目前,您需要在客户端或存储过程上对集合进行排序(尽管我建议在客户端上这样做,因为存储过程的执行是有限的)。

回答您的问题:

1) 我不相信有保证的默认排序

2) 存储过程将导致集合扫描,然后对其进行排序。

您可以通过在 Azure 反馈论坛上发表意见来帮助插入“排序依据”: http://feedback.azure.com/forums/263030-documentdb/suggestions/6334829--order-by-in-queries

关于azure - DocumentDB - 查询结果顺序,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/27040843/

相关文章:

具有分区文档数据库的 Azure 搜索服务

azure - 通过 join 过滤嵌套列表时是否使用 cosmos 索引?

c# - 如何将文件上传到 blob 存储并从附件中的 cosmosdb 文档引用它

azure - 使用 VPN 连接到 Azure SQL 数据库(点到站点)

azure - 在哪里查看 Azure HDInsight 脚本操作错误日志

按国家/地区排列的 Azure 搜索城市排名(第二个搜索字段)

c# - CosmosDb SDK v3 是否在批量插入时自动重试?

python - 如何为 Python 中的 document_client 对象发送的 Cosmos DB 查询设置连续 token ?

azure - 可以在 Kubernetes 群集上或使用 Azure Kubernetes 服务 (AKS) 预配 SharePoint 2016 场吗?

无法设置 Azure VM DNS 名称标签