| 1 | //===- AutoConvert.cpp - Auto conversion between ASCII/EBCDIC -------------===// | 
|---|
| 2 | // | 
|---|
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|---|
| 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|---|
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|---|
| 6 | // | 
|---|
| 7 | //===----------------------------------------------------------------------===// | 
|---|
| 8 | // | 
|---|
| 9 | // This file contains functions used for auto conversion between | 
|---|
| 10 | // ASCII/EBCDIC codepages specific to z/OS. | 
|---|
| 11 | // | 
|---|
| 12 | //===----------------------------------------------------------------------===// | 
|---|
| 13 |  | 
|---|
| 14 | #ifdef __MVS__ | 
|---|
| 15 |  | 
|---|
| 16 | #include "llvm/Support/AutoConvert.h" | 
|---|
| 17 | #include <cassert> | 
|---|
| 18 | #include <fcntl.h> | 
|---|
| 19 | #include <sys/stat.h> | 
|---|
| 20 | #include <unistd.h> | 
|---|
| 21 |  | 
|---|
| 22 | using namespace llvm; | 
|---|
| 23 |  | 
|---|
/// Per-descriptor record of the conversion command (cvtcmd) that was in effect
/// on a standard handle before enablezOSAutoConversion() modified it. The table
/// is indexed by file descriptor; -1 marks a slot with nothing recorded.
static int savedStdHandleAutoConversionMode[3] = {
    -1, // STDIN_FILENO
    -1, // STDOUT_FILENO
    -1, // STDERR_FILENO
};
|---|
| 25 |  | 
|---|
| 26 | int disablezOSAutoConversion(int FD) { | 
|---|
| 27 | static const struct f_cnvrt Convert = { | 
|---|
| 28 | SETCVTOFF, // cvtcmd | 
|---|
| 29 | 0,         // pccsid | 
|---|
| 30 | 0,         // fccsid | 
|---|
| 31 | }; | 
|---|
| 32 |  | 
|---|
| 33 | return fcntl(FD, F_CONTROL_CVT, &Convert); | 
|---|
| 34 | } | 
|---|
| 35 |  | 
|---|
| 36 | int restorezOSStdHandleAutoConversion(int FD) { | 
|---|
| 37 | assert(FD == STDIN_FILENO || FD == STDOUT_FILENO || FD == STDERR_FILENO); | 
|---|
| 38 | if (savedStdHandleAutoConversionMode[FD] == -1) | 
|---|
| 39 | return 0; | 
|---|
| 40 | struct f_cnvrt Cvt = { | 
|---|
| 41 | savedStdHandleAutoConversionMode[FD], // cvtcmd | 
|---|
| 42 | 0,                                    // pccsid | 
|---|
| 43 | 0,                                    // fccsid | 
|---|
| 44 | }; | 
|---|
| 45 | return (fcntl(FD, F_CONTROL_CVT, &Cvt)); | 
|---|
| 46 | } | 
|---|
| 47 |  | 
|---|
| 48 | int enablezOSAutoConversion(int FD) { | 
|---|
| 49 | struct f_cnvrt Query = { | 
|---|
| 50 | QUERYCVT, // cvtcmd | 
|---|
| 51 | 0,        // pccsid | 
|---|
| 52 | 0,        // fccsid | 
|---|
| 53 | }; | 
|---|
| 54 |  | 
|---|
| 55 | if (fcntl(FD, F_CONTROL_CVT, &Query) == -1) | 
|---|
| 56 | return -1; | 
|---|
| 57 |  | 
|---|
| 58 | // We don't need conversion for UTF-8 tagged files. | 
|---|
| 59 | // TODO: Remove the assumption of ISO8859-1 = UTF-8 here when we fully resolve | 
|---|
| 60 | // problems related to UTF-8 tagged source files. | 
|---|
| 61 | // When the pccsid is not ISO8859-1, autoconversion is still needed. | 
|---|
| 62 | if (Query.pccsid == CCSID_ISO8859_1 && | 
|---|
| 63 | (Query.fccsid == CCSID_UTF_8 || Query.fccsid == CCSID_ISO8859_1)) | 
|---|
| 64 | return 0; | 
|---|
| 65 |  | 
|---|
| 66 | // Save the state of std handles before we make changes to it. | 
|---|
| 67 | if ((FD == STDIN_FILENO || FD == STDOUT_FILENO || FD == STDERR_FILENO) && | 
|---|
| 68 | savedStdHandleAutoConversionMode[FD] == -1) | 
|---|
| 69 | savedStdHandleAutoConversionMode[FD] = Query.cvtcmd; | 
|---|
| 70 |  | 
|---|
| 71 | if (FD == STDOUT_FILENO || FD == STDERR_FILENO) | 
|---|
| 72 | Query.cvtcmd = SETCVTON; | 
|---|
| 73 | else | 
|---|
| 74 | Query.cvtcmd = SETCVTALL; | 
|---|
| 75 |  | 
|---|
| 76 | Query.pccsid = | 
|---|
| 77 | (FD == STDIN_FILENO || FD == STDOUT_FILENO || FD == STDERR_FILENO) | 
|---|
| 78 | ? 0 | 
|---|
| 79 | : CCSID_UTF_8; | 
|---|
| 80 | // Assume untagged files to be IBM-1047 encoded. | 
|---|
| 81 | Query.fccsid = (Query.fccsid == FT_UNTAGGED) ? CCSID_IBM_1047 : Query.fccsid; | 
|---|
| 82 | return fcntl(FD, F_CONTROL_CVT, &Query); | 
|---|
| 83 | } | 
|---|
| 84 |  | 
|---|
| 85 | std::error_code llvm::setzOSFileTag(int FD, int CCSID, bool Text) { | 
|---|
| 86 | assert((!Text || (CCSID != FT_UNTAGGED && CCSID != FT_BINARY)) && | 
|---|
| 87 | "FT_UNTAGGED and FT_BINARY are not allowed for text files"); | 
|---|
| 88 | struct file_tag Tag; | 
|---|
| 89 | Tag.ft_ccsid = CCSID; | 
|---|
| 90 | Tag.ft_txtflag = Text; | 
|---|
| 91 | Tag.ft_deferred = 0; | 
|---|
| 92 | Tag.ft_rsvflags = 0; | 
|---|
| 93 |  | 
|---|
| 94 | if (fcntl(FD, F_SETTAG, &Tag) == -1) | 
|---|
| 95 | return errnoAsErrorCode(); | 
|---|
| 96 | return std::error_code(); | 
|---|
| 97 | } | 
|---|
| 98 |  | 
|---|
| 99 | ErrorOr<__ccsid_t> llvm::getzOSFileTag(const char *FileName, const int FD) { | 
|---|
| 100 | // If we have a file descriptor, use it to find out file tagging. Otherwise we | 
|---|
| 101 | // need to use stat() with the file path. | 
|---|
| 102 | if (FD != -1) { | 
|---|
| 103 | struct f_cnvrt Query = { | 
|---|
| 104 | QUERYCVT, // cvtcmd | 
|---|
| 105 | 0,        // pccsid | 
|---|
| 106 | 0,        // fccsid | 
|---|
| 107 | }; | 
|---|
| 108 | if (fcntl(FD, F_CONTROL_CVT, &Query) == -1) | 
|---|
| 109 | return std::error_code(errno, std::generic_category()); | 
|---|
| 110 | return Query.fccsid; | 
|---|
| 111 | } | 
|---|
| 112 | struct stat Attr; | 
|---|
| 113 | if (stat(FileName, &Attr) == -1) | 
|---|
| 114 | return std::error_code(errno, std::generic_category()); | 
|---|
| 115 | return Attr.st_tag.ft_ccsid; | 
|---|
| 116 | } | 
|---|
| 117 |  | 
|---|
| 118 | ErrorOr<bool> llvm::needzOSConversion(const char *FileName, const int FD) { | 
|---|
| 119 | ErrorOr<__ccsid_t> Ccsid = getzOSFileTag(FileName, FD); | 
|---|
| 120 | if (std::error_code EC = Ccsid.getError()) | 
|---|
| 121 | return EC; | 
|---|
| 122 | // We don't need conversion for UTF-8 tagged files or binary files. | 
|---|
| 123 | // TODO: Remove the assumption of ISO8859-1 = UTF-8 here when we fully resolve | 
|---|
| 124 | // problems related to UTF-8 tagged source files. | 
|---|
| 125 | switch (*Ccsid) { | 
|---|
| 126 | case CCSID_UTF_8: | 
|---|
| 127 | case CCSID_ISO8859_1: | 
|---|
| 128 | case FT_BINARY: | 
|---|
| 129 | return false; | 
|---|
| 130 | default: | 
|---|
| 131 | return true; | 
|---|
| 132 | } | 
|---|
| 133 | } | 
|---|
| 134 |  | 
|---|
| 135 | #endif //__MVS__ | 
|---|
| 136 |  | 
|---|