apache 1.3 KB

1234567891011121314151617181920212223242526272829303132333435363738
  1. #------------------------------------------------------------------------------
  2. # $File: apache,v 1.3 2025/05/30 13:25:13 christos Exp $
  3. # apache: file(1) magic for Apache Big Data formats
  4. # Avro files
  5. 0 string Obj\001 Apache Avro, version 1
  6. # ORC files
  7. # Important information is in file footer, which we can't index to :(
  8. 0 string ORC Apache ORC
  9. # Apache Arrow file format
  10. # MIME: https://www.iana.org/assignments/media-types/application/vnd.apache.arrow.file
  11. # Description: https://arrow.apache.org/docs/format/Columnar.html
  12. 0 string ARROW1 Apache Arrow columnar file
  13. !:mime application/vnd.apache.arrow.file
  14. !:ext arrow/feather
  15. # Apache Parquet file format
  16. # MIME: https://www.iana.org/assignments/media-types/application/vnd.apache.parquet
  17. # Description: https://parquet.apache.org/docs/file-format/
  18. 0 string PAR1 Apache Parquet file
  19. !:mime application/vnd.apache.parquet
  20. !:ext parquet
  21. # Hive RC files
  22. 0 string RCF Apache Hive RC file
  23. >3 byte x version %d
  24. # Sequence files (and the careless first version of RC file)
  25. 0 string SEQ
  26. >3 byte <6 Apache Hadoop Sequence file version %d
  27. >3 byte >6 Apache Hadoop Sequence file version %d
  28. >3 byte =6
  29. >>5 string org.apache.hadoop.hive.ql.io.RCFile$KeyBuffer Apache Hive RC file version 0
  30. >>3 default x Apache Hadoop Sequence file version 6