clintropolis commented on PR #16132:
URL: https://github.com/apache/druid/pull/16132#issuecomment-2024678078

   Wired up smoosh analysis as an alternative for when size information is
unavailable; the output looks something like this:
   ```
   ...
           "smoosh": {
               "__time": 1972740,
               "adblock_list": 264,
               "adblock_list.__encodedColumn": 57684,
               "adblock_list.__stringDictionary": 110,
               "adblock_list.__valueIndexes": 120057,
               "agent": 384,
               "agent.__arrayDictionary": 5,
               "agent.__doubleDictionary": 6,
               "agent.__field_0": 515467,
               "agent.__field_1": 1002327,
               "agent.__field_2": 308161,
               "agent.__field_3": 680152,
               "agent.__field_4": 556802,
               "agent.__field_5": 274419,
               "agent.__longDictionary": 6,
               "agent.__raw": 5,
               "agent.__raw_compressed": 1624491,
               "agent.__raw_offsets": 1964643,
               "agent.__stringDictionary": 6709,
               "app_version": 263,
               "app_version.__encodedColumn": 1990,
               "app_version.__stringDictionary": 31,
               "app_version.__valueIndexes": 143,
               "client_ip": 261,
               "client_ip.__encodedColumn": 881953,
               "client_ip.__stringDictionary": 453370,
               "client_ip.__valueIndexes": 1472563,
               "event": 397,
               "event.__arrayDictionary": 5,
               "event.__doubleDictionary": 6,
               "event.__field_0": 3850,
               "event.__field_1": 703821,
               "event.__field_2": 1532655,
               "event.__field_3": 2616,
               "event.__field_4": 324067,
               "event.__field_5": 13028,
               "event.__field_6": 2389,
               "event.__longDictionary": 206,
               "event.__raw": 5,
               "event.__raw_compressed": 956686,
               "event.__raw_offsets": 1886242,
               "event.__stringDictionary": 28152,
               "geo_ip": 345,
               "geo_ip.__arrayDictionary": 5,
               "geo_ip.__doubleDictionary": 6,
               "geo_ip.__field_0": 2013216,
               "geo_ip.__field_1": 371382,
               "geo_ip.__field_2": 703667,
               "geo_ip.__field_3": 1616086,
               "geo_ip.__longDictionary": 6,
               "geo_ip.__raw": 5,
               "geo_ip.__raw_compressed": 2702906,
               "geo_ip.__raw_offsets": 1926682,
               "geo_ip.__stringDictionary": 131017,
               "index.drd": 1014,
               "language": 267,
               "language.__arrayDictionary": 13756,
               "language.__arrayElementDictionary": 1058,
               "language.__arrayElementIndexes": 687920,
               "language.__doubleDictionary": 6,
               "language.__encodedColumn": 427315,
               "language.__longDictionary": 6,
               "language.__stringDictionary": 3901,
               "language.__valueIndexes": 582112,
               "loaded_image": 264,
               "loaded_image.__encodedColumn": 346277,
               "loaded_image.__stringDictionary": 1213,
               "loaded_image.__valueIndexes": 641720,
               "metadata.drd": 157,
               "number": 258,
               "number.__encodedColumn": 414753,
               "number.__stringDictionary": 328,
               "number.__valueIndexes": 873812,
               "path": 256,
               "path.__encodedColumn": 272509,
               "path.__stringDictionary": 233449,
               "path.__valueIndexes": 342106,
               "referrer": 260,
               "referrer.__encodedColumn": 291826,
               "referrer.__stringDictionary": 238389,
               "referrer.__valueIndexes": 339389,
               "referrer_host": 265,
               "referrer_host.__encodedColumn": 209113,
               "referrer_host.__stringDictionary": 3841,
               "referrer_host.__valueIndexes": 300381,
               "screen": 258,
               "screen.__encodedColumn": 452611,
               "screen.__stringDictionary": 5729,
               "screen.__valueIndexes": 718696,
               "server_ip": 261,
               "server_ip.__encodedColumn": 120352,
               "server_ip.__stringDictionary": 57,
               "server_ip.__valueIndexes": 127184,
               "session": 259,
               "session.__encodedColumn": 904806,
               "session.__stringDictionary": 888795,
               "session.__valueIndexes": 2192612,
               "session_length": 264,
               "session_length.__encodedColumn": 1382863,
               "session_length.__longColumn": 1804957,
               "session_length.__longDictionary": 1442790,
               "session_length.__valueIndexes": 6566614,
               "timezone": 260,
               "timezone.__encodedColumn": 176501,
               "timezone.__stringDictionary": 596,
               "timezone.__valueIndexes": 295425,
               "timezone_offset": 267,
               "timezone_offset.__encodedColumn": 270411,
               "timezone_offset.__stringDictionary": 363,
               "timezone_offset.__valueIndexes": 452374,
               "window": 258,
               "window.__encodedColumn": 737726,
               "window.__stringDictionary": 172969,
               "window.__valueIndexes": 1230794
           }
   ```


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: commits-unsubscr...@druid.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscr...@druid.apache.org
For additional commands, e-mail: commits-h...@druid.apache.org

Reply via email to