You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

unpack_ooxml.sh 1.4KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445
  1. #!/bin/bash -e
  2. #
  3. # Licensed to the Apache Software Foundation (ASF) under one or more
  4. # contributor license agreements. See the NOTICE file distributed with
  5. # this work for additional information regarding copyright ownership.
  6. # The ASF licenses this file to You under the Apache License, Version 2.0
  7. # (the "License"); you may not use this file except in compliance with
  8. # the License. You may obtain a copy of the License at
  9. #
  10. # http://www.apache.org/licenses/LICENSE-2.0
  11. #
  12. # Unless required by applicable law or agreed to in writing, software
  13. # distributed under the License is distributed on an "AS IS" BASIS,
  14. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. # See the License for the specific language governing permissions and
  16. # limitations under the License.
  17. # basename it
  18. FILENAME="$1"
  19. BASENAME="${FILENAME##*/}"
  20. OUTDIR="${BASENAME%.*}"
  21. if [ ! -f "$FILENAME" ]; then
  22. echo "File $FILENAME does not exist"
  23. exit 1
  24. fi
  25. # if dir exists, fail
  26. if [ -d "$OUTDIR" ]; then
  27. echo "Directory '$OUTDIR' already exists!"
  28. exit 1
  29. fi
  30. mkdir "$OUTDIR"
  31. unzip -d "$OUTDIR" "$FILENAME"
  32. pushd "$OUTDIR"
  33. find . -type f \( -iname "*.xml" -or -iname "*.rels" \) -exec python -c "import os, sys, xml.dom.minidom
  34. with open('{}', 'r') as fp:
  35. s = fp.read()
  36. with open('{}.bak', 'w') as fp:
  37. fp.write(xml.dom.minidom.parseString(s).toprettyxml().encode('utf-8'))
  38. os.rename('{}.bak', '{}')" \;