changeset 373:0ccc746c8079

Zachary Travis - Add support for the OST 2013 format, and Content-Disposition filename key fix for outlook compatibility
author Carl Byington <carl@five-ten-sg.com>
date Fri, 21 Jul 2017 20:01:44 -0700 (2017-07-22)
parents 5b52efe35bd8
children 62f05deb2e1c
files configure.in libpst.spec.in src/Makefile.am src/libpst.c src/libpst.h src/readpst.c
diffstat 6 files changed, 188 insertions(+), 60 deletions(-) [+]
line wrap: on
line diff
--- a/configure.in	Fri Jul 21 19:54:46 2017 -0700
+++ b/configure.in	Fri Jul 21 20:01:44 2017 -0700
@@ -377,6 +377,8 @@
 AC_SUBST(GSF_FLAGS, [$gsf_flags])
 AC_SUBST(GSF_LIBS, [$gsf_libs])
 
+PKG_CHECK_MODULES([ZLIB], [zlib])
+
 AC_OUTPUT(                  \
     Makefile                \
     html/Makefile           \
--- a/libpst.spec.in	Fri Jul 21 19:54:46 2017 -0700
+++ b/libpst.spec.in	Fri Jul 21 20:01:44 2017 -0700
@@ -182,8 +182,10 @@
 
 
 %changelog
-* Wed Feb 08 2017 Carl Byington <carl@five-ten-sg.com> 0.6.71-1
+* Fri Jul 21 2017 Carl Byington <carl@five-ten-sg.com> 0.6.71-1
 - fedora python naming scheme changes
+- Zachary Travis - Add support for the OST 2013 format, and
+  Content-Disposition filename key fix for outlook compatibility
 
 * Thu Jul 20 2017 Kalev Lember <klember@redhat.com> - 0.6.70-3
 - Rebuilt for Boost 1.64
--- a/src/Makefile.am	Fri Jul 21 19:54:46 2017 -0700
+++ b/src/Makefile.am	Fri Jul 21 20:01:44 2017 -0700
@@ -91,13 +91,13 @@
 INCLUDES= -I$(srcdir)/.. $(all_includes)
 
 # the library search path.
-lspst_LDADD       = $(all_libraries) $(PSTLIB) $(LTLIBICONV)
-readpst_LDADD     = $(all_libraries) $(PSTLIB) $(LTLIBICONV) $(REGEXLIB) $(GSF_LIBS)
-pst2ldif_LDADD    = $(all_libraries) $(PSTLIB) $(LTLIBICONV)
-pst2dii_LDADD     = $(all_libraries) $(PSTLIB) $(LTLIBICONV) -lgd
-deltasearch_LDADD = $(all_libraries) $(PSTLIB) $(LTLIBICONV)
-dumpblocks_LDADD  = $(all_libraries) $(PSTLIB) $(LTLIBICONV)
-getidblock_LDADD  = $(all_libraries) $(PSTLIB) $(LTLIBICONV)
-nick2ldif_LDADD   = $(all_libraries) $(PSTLIB) $(LTLIBICONV)
+lspst_LDADD       = $(all_libraries) $(PSTLIB) $(LTLIBICONV) @ZLIB_LIBS@
+readpst_LDADD     = $(all_libraries) $(PSTLIB) $(LTLIBICONV) $(REGEXLIB) $(GSF_LIBS) @ZLIB_LIBS@
+pst2ldif_LDADD    = $(all_libraries) $(PSTLIB) $(LTLIBICONV) @ZLIB_LIBS@
+pst2dii_LDADD     = $(all_libraries) $(PSTLIB) $(LTLIBICONV) -lgd @ZLIB_LIBS@
+deltasearch_LDADD = $(all_libraries) $(PSTLIB) $(LTLIBICONV) @ZLIB_LIBS@
+dumpblocks_LDADD  = $(all_libraries) $(PSTLIB) $(LTLIBICONV) @ZLIB_LIBS@
+getidblock_LDADD  = $(all_libraries) $(PSTLIB) $(LTLIBICONV) @ZLIB_LIBS@
+nick2ldif_LDADD   = $(all_libraries) $(PSTLIB) $(LTLIBICONV) @ZLIB_LIBS@
 
 
--- a/src/libpst.c	Fri Jul 21 19:54:46 2017 -0700
+++ b/src/libpst.c	Fri Jul 21 20:01:44 2017 -0700
@@ -6,6 +6,7 @@
  */
 
 #include "define.h"
+#include "zlib.h"
 
 
 // switch to maximal packing for our own internal structures
@@ -23,6 +24,7 @@
 #define INDEX_TYPE32A           0x0F    // unknown, but assumed to be similar for now
 #define INDEX_TYPE64            0x17
 #define INDEX_TYPE64A           0x15    // http://sourceforge.net/projects/libpff/
+#define INDEX_TYPE4K            0x24
 #define INDEX_TYPE_OFFSET       (int64_t)0x0A
 
 #define FILE_SIZE_POINTER32     (int64_t)0xA8
@@ -46,6 +48,7 @@
 #define SECOND_BACK       ((pf->do_read64) ? SECOND_BACK64       : SECOND_BACK32)
 #define ENC_TYPE          ((pf->do_read64) ? ENC_TYPE64          : ENC_TYPE32)
 
+
 #define PST_SIGNATURE 0x4E444221
 
 
@@ -135,10 +138,19 @@
 } pst_desc;
 
 
+typedef struct pst_index64 {   // index entry layout that pst_decode_index reads when do_read64 == 1
+    uint64_t id;
+    uint64_t offset;
+    uint16_t size;             // also copied into pst_index.inflated_size by the decoder
+    int16_t  u0;
+    int32_t  u1;
+} pst_index64;
+
 typedef struct pst_index {
     uint64_t id;
     uint64_t offset;
     uint16_t size;
+    uint16_t inflated_size;    // read from the entry when do_read64 == 2; set equal to size for the other layouts
     int16_t  u0;
     int32_t  u1;
 } pst_index;
@@ -281,7 +293,8 @@
 static void             pst_printDptr(pst_file *pf, pst_desc_tree *ptr);
 static void             pst_printID2ptr(pst_id2_tree *ptr);
 static int              pst_process(uint64_t block_id, pst_mapi_object *list, pst_item *item, pst_item_attach *attach);
-static size_t           pst_read_block_size(pst_file *pf, int64_t offset, size_t size, char **buf);
+static size_t           pst_read_block_size(pst_file *pf, int64_t offset, size_t size, size_t inflated_size, char **buf);
+static size_t           pst_read_raw_block_size(pst_file *pf, int64_t offset, size_t size, char **buf);
 static int              pst_decrypt(uint64_t i_id, char *buf, size_t size, unsigned char type);
 static int              pst_strincmp(char *a, char *b, size_t x);
 static char*            pst_wide_to_single(char *wt, size_t size);
@@ -348,6 +361,9 @@
         case INDEX_TYPE64A :
             pf->do_read64 = 1;
             break;
+        case INDEX_TYPE4K :
+            pf->do_read64 = 2;
+            break;
         default:
             (void)fclose(pf->fp);
             DEBUG_WARN(("unknown .pst format, possibly newer than Outlook 2003 PST file?\n"));
@@ -807,31 +823,32 @@
 
 
 #define ITEM_COUNT_OFFSET32        0x1f0    // count byte
+#define MAX_COUNT_OFFSET32         0x1f1    // max count byte
+#define ENTRY_SIZE_OFFSET32        0x1f2    // entry size byte
 #define LEVEL_INDICATOR_OFFSET32   0x1f3    // node or leaf
 #define BACKLINK_OFFSET32          0x1f8    // backlink u1 value
-#define ITEM_SIZE32                12
-#define DESC_SIZE32                16
-#define INDEX_COUNT_MAX32          41       // max active items
-#define DESC_COUNT_MAX32           31       // max active items
 
 #define ITEM_COUNT_OFFSET64        0x1e8    // count byte
+#define MAX_COUNT_OFFSET64         0x1e9    // max count byte
+#define ENTRY_SIZE_OFFSET64        0x1ea    // entry size byte
 #define LEVEL_INDICATOR_OFFSET64   0x1eb    // node or leaf
 #define BACKLINK_OFFSET64          0x1f8    // backlink u1 value
-#define ITEM_SIZE64                24
-#define DESC_SIZE64                32
-#define INDEX_COUNT_MAX64          20       // max active items
-#define DESC_COUNT_MAX64           15       // max active items
-
-#define BLOCK_SIZE                 512      // index blocks
-#define DESC_BLOCK_SIZE            512      // descriptor blocks
-#define ITEM_COUNT_OFFSET        (size_t)((pf->do_read64) ? ITEM_COUNT_OFFSET64      : ITEM_COUNT_OFFSET32)
-#define LEVEL_INDICATOR_OFFSET   (size_t)((pf->do_read64) ? LEVEL_INDICATOR_OFFSET64 : LEVEL_INDICATOR_OFFSET32)
-#define BACKLINK_OFFSET          (size_t)((pf->do_read64) ? BACKLINK_OFFSET64        : BACKLINK_OFFSET32)
-#define ITEM_SIZE                (size_t)((pf->do_read64) ? ITEM_SIZE64              : ITEM_SIZE32)
-#define DESC_SIZE                (size_t)((pf->do_read64) ? DESC_SIZE64              : DESC_SIZE32)
-#define INDEX_COUNT_MAX         (int32_t)((pf->do_read64) ? INDEX_COUNT_MAX64        : INDEX_COUNT_MAX32)
-#define DESC_COUNT_MAX          (int32_t)((pf->do_read64) ? DESC_COUNT_MAX64         : DESC_COUNT_MAX32)
-
+
+#define ITEM_COUNT_OFFSET4K        0xfd8    // count, read as two bytes
+#define MAX_COUNT_OFFSET4K         0xfda    // max count, read as two bytes
+#define ENTRY_SIZE_OFFSET4K        0xfdc    // entry size byte
+#define LEVEL_INDICATOR_OFFSET4K   0xfdd    // node or leaf
+#define BACKLINK_OFFSET4K          0xff0    // backlink u1 value
+
+#define BLOCK_SIZE               (size_t)((pf->do_read64 == 2) ? 4096 : 512)      // index blocks
+#define DESC_BLOCK_SIZE          (size_t)((pf->do_read64 == 2) ? 4096 : 512)      // descriptor blocks
+#define ITEM_COUNT_OFFSET        (size_t)((pf->do_read64) ? (pf->do_read64 == 2 ? ITEM_COUNT_OFFSET4K : ITEM_COUNT_OFFSET64) : ITEM_COUNT_OFFSET32)
+#define LEVEL_INDICATOR_OFFSET   (size_t)((pf->do_read64) ? (pf->do_read64 == 2 ? LEVEL_INDICATOR_OFFSET4K : LEVEL_INDICATOR_OFFSET64) : LEVEL_INDICATOR_OFFSET32)
+#define BACKLINK_OFFSET          (size_t)((pf->do_read64) ? (pf->do_read64 == 2 ? BACKLINK_OFFSET4K : BACKLINK_OFFSET64) : BACKLINK_OFFSET32)
+#define ENTRY_SIZE_OFFSET        (size_t)((pf->do_read64) ? (pf->do_read64 == 2 ? ENTRY_SIZE_OFFSET4K : ENTRY_SIZE_OFFSET64) : ENTRY_SIZE_OFFSET32)
+#define MAX_COUNT_OFFSET         (size_t)((pf->do_read64) ? (pf->do_read64 == 2 ? MAX_COUNT_OFFSET4K : MAX_COUNT_OFFSET64) : MAX_COUNT_OFFSET32)
+
+#define read_twobyte(BUF, OFF)   ((int32_t)((((unsigned)(BUF)[(OFF) + 1] & 0xFF) << 8) | ((unsigned)(BUF)[(OFF)] & 0xFF)))  // little-endian unsigned 16-bit read at BUF[OFF]; fully parenthesized and without a trailing ';' so it can be used inside expressions
 
 static size_t pst_decode_desc(pst_file *pf, pst_desc *desc, char *buf);
 static size_t pst_decode_desc(pst_file *pf, pst_desc *desc, char *buf) {
@@ -899,16 +916,34 @@
 static size_t pst_decode_index(pst_file *pf, pst_index *index, char *buf);
 static size_t pst_decode_index(pst_file *pf, pst_index *index, char *buf) {
     size_t r;
-    if (pf->do_read64) {
-        DEBUG_INFO(("Decoding index64\n"));
+    if (pf->do_read64 == 2) {
+        DEBUG_INFO(("Decoding index4k\n"));
         DEBUG_HEXDUMPC(buf, sizeof(pst_index), 0x10);
         memcpy(index, buf, sizeof(pst_index));
         LE64_CPU(index->id);
         LE64_CPU(index->offset);
         LE16_CPU(index->size);
+        LE16_CPU(index->inflated_size);
         LE16_CPU(index->u0);
         LE32_CPU(index->u1);
         r = sizeof(pst_index);
+    } else  if (pf->do_read64 == 1) {
+        pst_index64 index64;
+        DEBUG_INFO(("Decoding index64\n"));
+        DEBUG_HEXDUMPC(buf, sizeof(pst_index64), 0x10);
+        memcpy(&index64, buf, sizeof(pst_index64));
+        LE64_CPU(index64.id);
+        LE64_CPU(index64.offset);
+        LE16_CPU(index64.size);
+        LE16_CPU(index64.u0);
+        LE32_CPU(index64.u1);
+        index->id     = index64.id;
+        index->offset = index64.offset;
+        index->size   = index64.size;
+        index->inflated_size = index64.size;
+        index->u0     = index64.u0;
+        index->u1     = index64.u1;
+        r = sizeof(pst_index64);
     } else {
         pst_index32 index32;
         DEBUG_INFO(("Decoding index32\n"));
@@ -921,6 +956,7 @@
         index->id     = index32.id;
         index->offset = index32.offset;
         index->size   = index32.size;
+        index->inflated_size = index32.size;
         index->u0     = 0;
         index->u1     = index32.u1;
         r = sizeof(pst_index32);
@@ -990,7 +1026,7 @@
     struct pst_table_ptr_struct table, table2;
     pst_index_ll *i_ptr=NULL;
     pst_index index;
-    int32_t x, item_count;
+    int32_t x, item_count, count_max;
     uint64_t old = start_val;
     char *buf = NULL, *bptr;
 
@@ -1002,17 +1038,23 @@
         return -1;
     }
     DEBUG_INFO(("Reading index block\n"));
-    if (pst_read_block_size(pf, offset, BLOCK_SIZE, &buf) < BLOCK_SIZE) {
+    if (pst_read_block_size(pf, offset, BLOCK_SIZE, BLOCK_SIZE, &buf) < BLOCK_SIZE) {
         DEBUG_WARN(("Failed to read %i bytes\n", BLOCK_SIZE));
         if (buf) free(buf);
         DEBUG_RET();
         return -1;
     }
     bptr = buf;
-    DEBUG_HEXDUMPC(buf, BLOCK_SIZE, ITEM_SIZE32);
-    item_count = (int32_t)(unsigned)(buf[ITEM_COUNT_OFFSET]);
-    if (item_count > INDEX_COUNT_MAX) {
-        DEBUG_WARN(("Item count %i too large, max is %i\n", item_count, INDEX_COUNT_MAX));
+    DEBUG_HEXDUMPC(buf, BLOCK_SIZE, 0x10);
+    if (pf->do_read64 == 2) {
+        item_count = read_twobyte(buf, ITEM_COUNT_OFFSET);
+        count_max = read_twobyte(buf, MAX_COUNT_OFFSET);
+    } else {
+        item_count = (int32_t)(unsigned)(buf[ITEM_COUNT_OFFSET]);
+        count_max = (int32_t)(unsigned)(buf[MAX_COUNT_OFFSET]);
+    }
+    if (item_count > count_max) {
+        DEBUG_WARN(("Item count %i too large, max is %i\n", item_count, count_max));
         if (buf) free(buf);
         DEBUG_RET();
         return -1;
@@ -1024,12 +1066,14 @@
         DEBUG_RET();
         return -1;
     }
-
+    int entry_size = (int32_t)(unsigned)(buf[ENTRY_SIZE_OFFSET]);
+    DEBUG_INFO(("count %#"PRIx64" max %#"PRIx64" size %#"PRIx64"\n", item_count, count_max, entry_size));
     if (buf[LEVEL_INDICATOR_OFFSET] == '\0') {
         // this node contains leaf pointers
         x = 0;
         while (x < item_count) {
-            bptr += pst_decode_index(pf, &index, bptr);
+            pst_decode_index(pf, &index, bptr);
+            bptr += entry_size;
             x++;
             if (index.id == 0) break;
             DEBUG_INFO(("[%i]%i Item [id = %#"PRIx64", offset = %#"PRIx64", u1 = %#x, size = %i(%#x)]\n",
@@ -1051,12 +1095,14 @@
             i_ptr->offset = index.offset;
             i_ptr->u1     = index.u1;
             i_ptr->size   = index.size;
+            i_ptr->inflated_size = index.inflated_size;
         }
     } else {
         // this node contains node pointers
         x = 0;
         while (x < item_count) {
-            bptr += pst_decode_table(pf, &table, bptr);
+            pst_decode_table(pf, &table, bptr);
+            bptr += entry_size;
             x++;
             if (table.start == 0) break;
             if (x < item_count) {
@@ -1090,7 +1136,7 @@
 static int pst_build_desc_ptr (pst_file *pf, int64_t offset, int32_t depth, uint64_t linku1, uint64_t start_val, uint64_t end_val) {
     struct pst_table_ptr_struct table, table2;
     pst_desc desc_rec;
-    int32_t item_count;
+    int32_t item_count, count_max;
     uint64_t old = start_val;
     int x;
     char *buf = NULL, *bptr;
@@ -1103,15 +1149,20 @@
         return -1;
     }
     DEBUG_INFO(("Reading desc block\n"));
-    if (pst_read_block_size(pf, offset, DESC_BLOCK_SIZE, &buf) < DESC_BLOCK_SIZE) {
+    if (pst_read_block_size(pf, offset, DESC_BLOCK_SIZE, DESC_BLOCK_SIZE, &buf) < DESC_BLOCK_SIZE) {
         DEBUG_WARN(("Failed to read %i bytes\n", DESC_BLOCK_SIZE));
         if (buf) free(buf);
         DEBUG_RET();
         return -1;
     }
     bptr = buf;
-    item_count = (int32_t)(unsigned)(buf[ITEM_COUNT_OFFSET]);
-
+    if (pf->do_read64 == 2) {
+        item_count = read_twobyte(buf, ITEM_COUNT_OFFSET);
+        count_max = read_twobyte(buf, MAX_COUNT_OFFSET);
+    } else {
+        item_count = (int32_t)(unsigned)(buf[ITEM_COUNT_OFFSET]);
+        count_max = (int32_t)(unsigned)(buf[MAX_COUNT_OFFSET]);
+    }
     desc_rec.d_id = pst_getIntAt(pf, buf+BACKLINK_OFFSET);
     if (desc_rec.d_id != linku1) {
         DEBUG_WARN(("Backlink %#"PRIx64" in this node does not match required %#"PRIx64"\n", desc_rec.d_id, linku1));
@@ -1119,17 +1170,19 @@
         DEBUG_RET();
         return -1;
     }
+    int32_t entry_size = (int32_t)(unsigned)(buf[ENTRY_SIZE_OFFSET]);
     if (buf[LEVEL_INDICATOR_OFFSET] == '\0') {
         // this node contains leaf pointers
-        DEBUG_HEXDUMPC(buf, DESC_BLOCK_SIZE, DESC_SIZE32);
-        if (item_count > DESC_COUNT_MAX) {
-            DEBUG_WARN(("Item count %i too large, max is %i\n", item_count, DESC_COUNT_MAX));
+        DEBUG_HEXDUMPC(buf, DESC_BLOCK_SIZE, entry_size);
+        if (item_count > count_max) {
+            DEBUG_WARN(("Item count %i too large, max is %i\n", item_count, count_max));
             if (buf) free(buf);
             DEBUG_RET();
             return -1;
         }
         for (x=0; x<item_count; x++) {
-            bptr += pst_decode_desc(pf, &desc_rec, bptr);
+            pst_decode_desc(pf, &desc_rec, bptr);
+            bptr += entry_size;
             DEBUG_INFO(("[%i] Item(%#x) = [d_id = %#"PRIx64", desc_id = %#"PRIx64", tree_id = %#"PRIx64", parent_d_id = %#x]\n",
                         depth, x, desc_rec.d_id, desc_rec.desc_id, desc_rec.tree_id, desc_rec.parent_d_id));
             if ((desc_rec.d_id >= end_val) || (desc_rec.d_id < old)) {
@@ -1152,15 +1205,16 @@
         }
     } else {
         // this node contains node pointers
-        DEBUG_HEXDUMPC(buf, DESC_BLOCK_SIZE, ITEM_SIZE32);
-        if (item_count > INDEX_COUNT_MAX) {
-            DEBUG_WARN(("Item count %i too large, max is %i\n", item_count, INDEX_COUNT_MAX));
+        DEBUG_HEXDUMPC(buf, DESC_BLOCK_SIZE, entry_size);
+        if (item_count > count_max) {
+            DEBUG_WARN(("Item count %i too large, max is %i\n", item_count, count_max));
             if (buf) free(buf);
             DEBUG_RET();
             return -1;
         }
         for (x=0; x<item_count; x++) {
-            bptr += pst_decode_table(pf, &table, bptr);
+            pst_decode_table(pf, &table, bptr);
+            bptr += entry_size;
             if (table.start == 0) break;
             if (x < (item_count-1)) {
                 (void)pst_decode_table(pf, &table2, bptr);
@@ -3246,7 +3300,7 @@
     pst_id2_tree *i2_ptr = NULL;
     DEBUG_ENT("pst_build_id2");
 
-    if (pst_read_block_size(pf, list->offset, list->size, &buf) < list->size) {
+    if (pst_read_block_size(pf, list->offset, list->size, list->inflated_size, &buf) < list->size) {
         //an error occured in block read
         DEBUG_WARN(("block read error occured. offset = %#"PRIx64", size = %#"PRIx64"\n", list->offset, list->size));
         if (buf) free(buf);
@@ -3277,7 +3331,7 @@
             DEBUG_WARN(("%#"PRIx64" - Not Found\n", id2_rec.id));
         } else {
             DEBUG_INFO(("%#"PRIx64" - Offset %#"PRIx64", u1 %#"PRIx64", Size %"PRIi64"(%#"PRIx64")\n",
-                         i_ptr->i_id, i_ptr->offset, i_ptr->u1, i_ptr->size, i_ptr->size));
+                         i_ptr->i_id, i_ptr->offset, i_ptr->u1, i_ptr->size, i_ptr->inflated_size));
             // add it to the tree
             i2_ptr = (pst_id2_tree*) pst_malloc(sizeof(pst_id2_tree));
             i2_ptr->id2   = id2_rec.id2;
@@ -3564,8 +3618,13 @@
         }
     }
     else {
+        DEBUG_WARN(("Found internal %#x value.\n", offset));
         // internal index reference
         size_t subindex  = offset >> 16;
+        if (pf->do_read64 == 2) {
+            // Shift over 3 more bits for new flags.
+            subindex = subindex >> 3;
+        }
         size_t suboffset = offset & 0xffff;
         if (subindex < subblocks->subblock_count) {
             if (pst_getBlockOffset(subblocks->subs[subindex].buf,
@@ -3720,10 +3779,10 @@
                  is non-NULL, it will first be free()d
  * @return       size of block read into memory
  */
-static size_t pst_read_block_size(pst_file *pf, int64_t offset, size_t size, char **buf) {
+static size_t pst_read_raw_block_size(pst_file *pf, int64_t offset, size_t size, char **buf) {
     size_t rsize;
-    DEBUG_ENT("pst_read_block_size");
-    DEBUG_INFO(("Reading block from %#"PRIx64", %x bytes\n", offset, size));
+    DEBUG_ENT("pst_read_raw_block_size");
+    DEBUG_INFO(("Reading raw block from %#"PRIx64", %x bytes\n", offset, size));
 
     if (*buf) {
         DEBUG_INFO(("Freeing old memory\n"));
@@ -3747,6 +3806,36 @@
     return rsize;
 }
 
+/** Read a block into *buf, inflating it with zlib when inflated_size > size; an old *buf is freed first.
+ * @return bytes placed in *buf, or 0 on failure (*buf may then still hold an allocation the caller frees) */
+static size_t pst_read_block_size(pst_file *pf, int64_t offset, size_t size, size_t inflated_size, char **buf) {
+    DEBUG_ENT("pst_read_block_size");
+    DEBUG_INFO(("Reading block from %#"PRIx64", %x bytes, %x inflated\n", offset, (unsigned)size, (unsigned)inflated_size));
+    if (inflated_size <= size) {
+        // Not deflated.
+        size_t ret = pst_read_raw_block_size(pf, offset, size, buf);
+        DEBUG_RET();
+        return ret;
+    }
+    // Deflated: read the stored bytes into a scratch buffer, then inflate them into a fresh *buf.
+    char *zbuf = NULL;
+    size_t got = 0;                               // stays 0 on failure so callers' "< expected size" checks trip
+    uLongf result_size = (uLongf) inflated_size;  // uncompress() takes a uLongf*, which need not alias size_t*
+    if (*buf) free(*buf);                         // honour the same "old buffer is freed" contract as the raw reader
+    *buf = (char *) pst_malloc(inflated_size);
+    if (pst_read_raw_block_size(pf, offset, size, &zbuf) != size) {
+        DEBUG_WARN(("Failed to read %i bytes\n", (int)size));
+    } else if (uncompress((Bytef *) *buf, &result_size, (Bytef *) zbuf, (uLong) size) != Z_OK || result_size != inflated_size) {
+        DEBUG_WARN(("Failed to uncompress %i bytes to %i bytes, got %i\n", (int)size, (int)inflated_size, (int)result_size));
+    } else {
+        got = inflated_size;
+    }
+    free(zbuf);                                   // scratch buffer is released on every path, including success
+    DEBUG_RET();
+    return got;
+}
+
+
 
 /** Decrypt a block of data from the pst file.
  * @param i_id identifier of this block, needed as part of the key for the enigma cipher
@@ -3923,7 +4012,7 @@
         return 0;
     }
     DEBUG_INFO(("id = %#"PRIx64", record size = %#x, offset = %#x\n", i_id, rec->size, rec->offset));
-    rsize = pst_read_block_size(pf, rec->offset, rec->size, buf);
+    rsize = pst_read_block_size(pf, rec->offset, rec->size, rec->inflated_size, buf);
     DEBUG_RET();
     return rsize;
 }
--- a/src/libpst.h	Fri Jul 21 19:54:46 2017 -0700
+++ b/src/libpst.h	Fri Jul 21 20:01:44 2017 -0700
@@ -105,6 +105,7 @@
     uint64_t i_id;
     uint64_t offset;
     uint64_t size;
+    uint64_t inflated_size;
     int64_t  u1;
 } pst_index_ll;
 
@@ -907,7 +908,8 @@
     pst_block_recorder *block_head;
 
     /** @li 0 is 32-bit pst file, pre Outlook 2003;
-     *  @li 1 is 64-bit pst file, Outlook 2003 or later */
+     *  @li 1 is 64-bit pst file, Outlook 2003 or later;
+     *  @li 2 is 64-bit OST file, Outlook 2013 or later */
     int do_read64;
     /** file offset of the first b-tree node in the index tree */
     uint64_t index1;
--- a/src/readpst.c	Fri Jul 21 19:54:46 2017 -0700
+++ b/src/readpst.c	Fri Jul 21 20:01:44 2017 -0700
@@ -66,6 +66,7 @@
 void      write_appointment(FILE* f_output, pst_item *item);
 void      create_enter_dir(struct file_ll* f, pst_item *item);
 void      close_enter_dir(struct file_ll *f);
+char*     quote_string(char *inp);
 
 const char*  prog_name;
 char*  output_dir = ".";
@@ -1151,6 +1152,32 @@
     DEBUG_RET();
 }
 
+/**
+ * Backslash-escape double quotes and backslashes in the given string.
+ * @param inp NUL-terminated input, left unmodified
+ * @return    malloc()ed escaped copy (caller frees), or NULL if malloc fails
+ */
+char *quote_string(char *inp) {
+    size_t len = 0;     // bytes in inp, not counting the terminator
+    size_t extra = 0;   // characters that get a backslash in front
+    // test each character BEFORE stepping past it, so the first one is counted
+    for (const char *p = inp; *p; p++, len++) {
+        if (*p == '\"' || *p == '\\') {
+            extra++;
+        }
+    }
+    char *res = malloc(len + extra + 1);
+    if (!res) return NULL;
+    char *out = res;
+    for (const char *p = inp; *p; p++) {
+        if (*p == '\"' || *p == '\\') {
+            *out++ = '\\';
+        }
+        *out++ = *p;
+    }
+    *out = '\0';
+    return res;
+}
 
 void write_inline_attachment(FILE* f_output, pst_item_attach* attach, char *boundary, pst_file* pst)
 {
@@ -1182,8 +1209,14 @@
     if (attach->filename2.str) {
         // use the long filename, converted to proper encoding if needed.
         // it is already utf8
+        char *escaped = quote_string(attach->filename2.str);
         pst_rfc2231(&attach->filename2);
-        fprintf(f_output, "Content-Disposition: attachment; \n        filename*=%s\n\n", attach->filename2.str);
+        fprintf(f_output, "Content-Disposition: attachment; \n        filename*=%s;\n", attach->filename2.str);
+        // Also include the (escaped) utf8 filename in the 'filename' header directly - this is not strictly valid
+        // (since this header should be ASCII) but is almost always handled correctly (and in fact this is the only
+        // way to get MS Outlook to correctly read a UTF8 filename, AFAICT, which is why we're doing it).
+        fprintf(f_output, "        filename=\"%s\"\n\n", escaped);
+        free(escaped);
     }
     else if (attach->filename1.str) {
         // short filename never needs encoding